xref: /openbmc/linux/drivers/dma/dmatest.c (revision df2634f43f5106947f3735a0b61a6527a4b278cd)
1 /*
2  * DMA Engine test module
3  *
4  * Copyright (C) 2007 Atmel Corporation
5  *
6  * This program is free software; you can redistribute it and/or modify
7  * it under the terms of the GNU General Public License version 2 as
8  * published by the Free Software Foundation.
9  */
10 #include <linux/delay.h>
11 #include <linux/dmaengine.h>
12 #include <linux/init.h>
13 #include <linux/kthread.h>
14 #include <linux/module.h>
15 #include <linux/moduleparam.h>
16 #include <linux/random.h>
17 #include <linux/slab.h>
18 #include <linux/wait.h>
19 
20 static unsigned int test_buf_size = 16384;
21 module_param(test_buf_size, uint, S_IRUGO);
22 MODULE_PARM_DESC(test_buf_size, "Size of the memcpy test buffer");
23 
24 static char test_channel[20];
25 module_param_string(channel, test_channel, sizeof(test_channel), S_IRUGO);
26 MODULE_PARM_DESC(channel, "Bus ID of the channel to test (default: any)");
27 
28 static char test_device[20];
29 module_param_string(device, test_device, sizeof(test_device), S_IRUGO);
30 MODULE_PARM_DESC(device, "Bus ID of the DMA Engine to test (default: any)");
31 
32 static unsigned int threads_per_chan = 1;
33 module_param(threads_per_chan, uint, S_IRUGO);
34 MODULE_PARM_DESC(threads_per_chan,
35 		"Number of threads to start per channel (default: 1)");
36 
37 static unsigned int max_channels;
38 module_param(max_channels, uint, S_IRUGO);
39 MODULE_PARM_DESC(max_channels,
40 		"Maximum number of channels to use (default: all)");
41 
42 static unsigned int iterations;
43 module_param(iterations, uint, S_IRUGO);
44 MODULE_PARM_DESC(iterations,
45 		"Iterations before stopping test (default: infinite)");
46 
47 static unsigned int xor_sources = 3;
48 module_param(xor_sources, uint, S_IRUGO);
49 MODULE_PARM_DESC(xor_sources,
50 		"Number of xor source buffers (default: 3)");
51 
52 static unsigned int pq_sources = 3;
53 module_param(pq_sources, uint, S_IRUGO);
54 MODULE_PARM_DESC(pq_sources,
55 		"Number of p+q source buffers (default: 3)");
56 
57 /*
58  * Initialization patterns. All bytes in the source buffer has bit 7
59  * set, all bytes in the destination buffer has bit 7 cleared.
60  *
61  * Bit 6 is set for all bytes which are to be copied by the DMA
62  * engine. Bit 5 is set for all bytes which are to be overwritten by
63  * the DMA engine.
64  *
65  * The remaining bits are the inverse of a counter which increments by
66  * one for each byte address.
67  */
68 #define PATTERN_SRC		0x80
69 #define PATTERN_DST		0x00
70 #define PATTERN_COPY		0x40
71 #define PATTERN_OVERWRITE	0x20
72 #define PATTERN_COUNT_MASK	0x1f
73 
74 struct dmatest_thread {
75 	struct list_head	node;
76 	struct task_struct	*task;
77 	struct dma_chan		*chan;
78 	u8			**srcs;
79 	u8			**dsts;
80 	enum dma_transaction_type type;
81 };
82 
83 struct dmatest_chan {
84 	struct list_head	node;
85 	struct dma_chan		*chan;
86 	struct list_head	threads;
87 };
88 
89 /*
90  * These are protected by dma_list_mutex since they're only used by
91  * the DMA filter function callback
92  */
93 static LIST_HEAD(dmatest_channels);
94 static unsigned int nr_channels;
95 
96 static bool dmatest_match_channel(struct dma_chan *chan)
97 {
98 	if (test_channel[0] == '\0')
99 		return true;
100 	return strcmp(dma_chan_name(chan), test_channel) == 0;
101 }
102 
103 static bool dmatest_match_device(struct dma_device *device)
104 {
105 	if (test_device[0] == '\0')
106 		return true;
107 	return strcmp(dev_name(device->dev), test_device) == 0;
108 }
109 
110 static unsigned long dmatest_random(void)
111 {
112 	unsigned long buf;
113 
114 	get_random_bytes(&buf, sizeof(buf));
115 	return buf;
116 }
117 
118 static void dmatest_init_srcs(u8 **bufs, unsigned int start, unsigned int len)
119 {
120 	unsigned int i;
121 	u8 *buf;
122 
123 	for (; (buf = *bufs); bufs++) {
124 		for (i = 0; i < start; i++)
125 			buf[i] = PATTERN_SRC | (~i & PATTERN_COUNT_MASK);
126 		for ( ; i < start + len; i++)
127 			buf[i] = PATTERN_SRC | PATTERN_COPY
128 				| (~i & PATTERN_COUNT_MASK);
129 		for ( ; i < test_buf_size; i++)
130 			buf[i] = PATTERN_SRC | (~i & PATTERN_COUNT_MASK);
131 		buf++;
132 	}
133 }
134 
135 static void dmatest_init_dsts(u8 **bufs, unsigned int start, unsigned int len)
136 {
137 	unsigned int i;
138 	u8 *buf;
139 
140 	for (; (buf = *bufs); bufs++) {
141 		for (i = 0; i < start; i++)
142 			buf[i] = PATTERN_DST | (~i & PATTERN_COUNT_MASK);
143 		for ( ; i < start + len; i++)
144 			buf[i] = PATTERN_DST | PATTERN_OVERWRITE
145 				| (~i & PATTERN_COUNT_MASK);
146 		for ( ; i < test_buf_size; i++)
147 			buf[i] = PATTERN_DST | (~i & PATTERN_COUNT_MASK);
148 	}
149 }
150 
151 static void dmatest_mismatch(u8 actual, u8 pattern, unsigned int index,
152 		unsigned int counter, bool is_srcbuf)
153 {
154 	u8		diff = actual ^ pattern;
155 	u8		expected = pattern | (~counter & PATTERN_COUNT_MASK);
156 	const char	*thread_name = current->comm;
157 
158 	if (is_srcbuf)
159 		pr_warning("%s: srcbuf[0x%x] overwritten!"
160 				" Expected %02x, got %02x\n",
161 				thread_name, index, expected, actual);
162 	else if ((pattern & PATTERN_COPY)
163 			&& (diff & (PATTERN_COPY | PATTERN_OVERWRITE)))
164 		pr_warning("%s: dstbuf[0x%x] not copied!"
165 				" Expected %02x, got %02x\n",
166 				thread_name, index, expected, actual);
167 	else if (diff & PATTERN_SRC)
168 		pr_warning("%s: dstbuf[0x%x] was copied!"
169 				" Expected %02x, got %02x\n",
170 				thread_name, index, expected, actual);
171 	else
172 		pr_warning("%s: dstbuf[0x%x] mismatch!"
173 				" Expected %02x, got %02x\n",
174 				thread_name, index, expected, actual);
175 }
176 
177 static unsigned int dmatest_verify(u8 **bufs, unsigned int start,
178 		unsigned int end, unsigned int counter, u8 pattern,
179 		bool is_srcbuf)
180 {
181 	unsigned int i;
182 	unsigned int error_count = 0;
183 	u8 actual;
184 	u8 expected;
185 	u8 *buf;
186 	unsigned int counter_orig = counter;
187 
188 	for (; (buf = *bufs); bufs++) {
189 		counter = counter_orig;
190 		for (i = start; i < end; i++) {
191 			actual = buf[i];
192 			expected = pattern | (~counter & PATTERN_COUNT_MASK);
193 			if (actual != expected) {
194 				if (error_count < 32)
195 					dmatest_mismatch(actual, pattern, i,
196 							 counter, is_srcbuf);
197 				error_count++;
198 			}
199 			counter++;
200 		}
201 	}
202 
203 	if (error_count > 32)
204 		pr_warning("%s: %u errors suppressed\n",
205 			current->comm, error_count - 32);
206 
207 	return error_count;
208 }
209 
210 static void dmatest_callback(void *completion)
211 {
212 	complete(completion);
213 }
214 
215 /*
216  * This function repeatedly tests DMA transfers of various lengths and
217  * offsets for a given operation type until it is told to exit by
218  * kthread_stop(). There may be multiple threads running this function
219  * in parallel for a single channel, and there may be multiple channels
220  * being tested in parallel.
221  *
222  * Before each test, the source and destination buffer is initialized
223  * with a known pattern. This pattern is different depending on
224  * whether it's in an area which is supposed to be copied or
225  * overwritten, and different in the source and destination buffers.
226  * So if the DMA engine doesn't copy exactly what we tell it to copy,
227  * we'll notice.
228  */
229 static int dmatest_func(void *data)
230 {
231 	struct dmatest_thread	*thread = data;
232 	struct dma_chan		*chan;
233 	const char		*thread_name;
234 	unsigned int		src_off, dst_off, len;
235 	unsigned int		error_count;
236 	unsigned int		failed_tests = 0;
237 	unsigned int		total_tests = 0;
238 	dma_cookie_t		cookie;
239 	enum dma_status		status;
240 	enum dma_ctrl_flags 	flags;
241 	u8			pq_coefs[pq_sources + 1];
242 	int			ret;
243 	int			src_cnt;
244 	int			dst_cnt;
245 	int			i;
246 
247 	thread_name = current->comm;
248 
249 	ret = -ENOMEM;
250 
251 	smp_rmb();
252 	chan = thread->chan;
253 	if (thread->type == DMA_MEMCPY)
254 		src_cnt = dst_cnt = 1;
255 	else if (thread->type == DMA_XOR) {
256 		src_cnt = xor_sources | 1; /* force odd to ensure dst = src */
257 		dst_cnt = 1;
258 	} else if (thread->type == DMA_PQ) {
259 		src_cnt = pq_sources | 1; /* force odd to ensure dst = src */
260 		dst_cnt = 2;
261 		for (i = 0; i < src_cnt; i++)
262 			pq_coefs[i] = 1;
263 	} else
264 		goto err_srcs;
265 
266 	thread->srcs = kcalloc(src_cnt+1, sizeof(u8 *), GFP_KERNEL);
267 	if (!thread->srcs)
268 		goto err_srcs;
269 	for (i = 0; i < src_cnt; i++) {
270 		thread->srcs[i] = kmalloc(test_buf_size, GFP_KERNEL);
271 		if (!thread->srcs[i])
272 			goto err_srcbuf;
273 	}
274 	thread->srcs[i] = NULL;
275 
276 	thread->dsts = kcalloc(dst_cnt+1, sizeof(u8 *), GFP_KERNEL);
277 	if (!thread->dsts)
278 		goto err_dsts;
279 	for (i = 0; i < dst_cnt; i++) {
280 		thread->dsts[i] = kmalloc(test_buf_size, GFP_KERNEL);
281 		if (!thread->dsts[i])
282 			goto err_dstbuf;
283 	}
284 	thread->dsts[i] = NULL;
285 
286 	set_user_nice(current, 10);
287 
288 	flags = DMA_CTRL_ACK | DMA_COMPL_SKIP_DEST_UNMAP | DMA_PREP_INTERRUPT;
289 
290 	while (!kthread_should_stop()
291 	       && !(iterations && total_tests >= iterations)) {
292 		struct dma_device *dev = chan->device;
293 		struct dma_async_tx_descriptor *tx = NULL;
294 		dma_addr_t dma_srcs[src_cnt];
295 		dma_addr_t dma_dsts[dst_cnt];
296 		struct completion cmp;
297 		unsigned long tmo = msecs_to_jiffies(3000);
298 		u8 align = 0;
299 
300 		total_tests++;
301 
302 		/* honor alignment restrictions */
303 		if (thread->type == DMA_MEMCPY)
304 			align = dev->copy_align;
305 		else if (thread->type == DMA_XOR)
306 			align = dev->xor_align;
307 		else if (thread->type == DMA_PQ)
308 			align = dev->pq_align;
309 
310 		if (1 << align > test_buf_size) {
311 			pr_err("%u-byte buffer too small for %d-byte alignment\n",
312 			       test_buf_size, 1 << align);
313 			break;
314 		}
315 
316 		len = dmatest_random() % test_buf_size + 1;
317 		len = (len >> align) << align;
318 		if (!len)
319 			len = 1 << align;
320 		src_off = dmatest_random() % (test_buf_size - len + 1);
321 		dst_off = dmatest_random() % (test_buf_size - len + 1);
322 
323 		src_off = (src_off >> align) << align;
324 		dst_off = (dst_off >> align) << align;
325 
326 		dmatest_init_srcs(thread->srcs, src_off, len);
327 		dmatest_init_dsts(thread->dsts, dst_off, len);
328 
329 		for (i = 0; i < src_cnt; i++) {
330 			u8 *buf = thread->srcs[i] + src_off;
331 
332 			dma_srcs[i] = dma_map_single(dev->dev, buf, len,
333 						     DMA_TO_DEVICE);
334 		}
335 		/* map with DMA_BIDIRECTIONAL to force writeback/invalidate */
336 		for (i = 0; i < dst_cnt; i++) {
337 			dma_dsts[i] = dma_map_single(dev->dev, thread->dsts[i],
338 						     test_buf_size,
339 						     DMA_BIDIRECTIONAL);
340 		}
341 
342 
343 		if (thread->type == DMA_MEMCPY)
344 			tx = dev->device_prep_dma_memcpy(chan,
345 							 dma_dsts[0] + dst_off,
346 							 dma_srcs[0], len,
347 							 flags);
348 		else if (thread->type == DMA_XOR)
349 			tx = dev->device_prep_dma_xor(chan,
350 						      dma_dsts[0] + dst_off,
351 						      dma_srcs, src_cnt,
352 						      len, flags);
353 		else if (thread->type == DMA_PQ) {
354 			dma_addr_t dma_pq[dst_cnt];
355 
356 			for (i = 0; i < dst_cnt; i++)
357 				dma_pq[i] = dma_dsts[i] + dst_off;
358 			tx = dev->device_prep_dma_pq(chan, dma_pq, dma_srcs,
359 						     src_cnt, pq_coefs,
360 						     len, flags);
361 		}
362 
363 		if (!tx) {
364 			for (i = 0; i < src_cnt; i++)
365 				dma_unmap_single(dev->dev, dma_srcs[i], len,
366 						 DMA_TO_DEVICE);
367 			for (i = 0; i < dst_cnt; i++)
368 				dma_unmap_single(dev->dev, dma_dsts[i],
369 						 test_buf_size,
370 						 DMA_BIDIRECTIONAL);
371 			pr_warning("%s: #%u: prep error with src_off=0x%x "
372 					"dst_off=0x%x len=0x%x\n",
373 					thread_name, total_tests - 1,
374 					src_off, dst_off, len);
375 			msleep(100);
376 			failed_tests++;
377 			continue;
378 		}
379 
380 		init_completion(&cmp);
381 		tx->callback = dmatest_callback;
382 		tx->callback_param = &cmp;
383 		cookie = tx->tx_submit(tx);
384 
385 		if (dma_submit_error(cookie)) {
386 			pr_warning("%s: #%u: submit error %d with src_off=0x%x "
387 					"dst_off=0x%x len=0x%x\n",
388 					thread_name, total_tests - 1, cookie,
389 					src_off, dst_off, len);
390 			msleep(100);
391 			failed_tests++;
392 			continue;
393 		}
394 		dma_async_issue_pending(chan);
395 
396 		tmo = wait_for_completion_timeout(&cmp, tmo);
397 		status = dma_async_is_tx_complete(chan, cookie, NULL, NULL);
398 
399 		if (tmo == 0) {
400 			pr_warning("%s: #%u: test timed out\n",
401 				   thread_name, total_tests - 1);
402 			failed_tests++;
403 			continue;
404 		} else if (status != DMA_SUCCESS) {
405 			pr_warning("%s: #%u: got completion callback,"
406 				   " but status is \'%s\'\n",
407 				   thread_name, total_tests - 1,
408 				   status == DMA_ERROR ? "error" : "in progress");
409 			failed_tests++;
410 			continue;
411 		}
412 
413 		/* Unmap by myself (see DMA_COMPL_SKIP_DEST_UNMAP above) */
414 		for (i = 0; i < dst_cnt; i++)
415 			dma_unmap_single(dev->dev, dma_dsts[i], test_buf_size,
416 					 DMA_BIDIRECTIONAL);
417 
418 		error_count = 0;
419 
420 		pr_debug("%s: verifying source buffer...\n", thread_name);
421 		error_count += dmatest_verify(thread->srcs, 0, src_off,
422 				0, PATTERN_SRC, true);
423 		error_count += dmatest_verify(thread->srcs, src_off,
424 				src_off + len, src_off,
425 				PATTERN_SRC | PATTERN_COPY, true);
426 		error_count += dmatest_verify(thread->srcs, src_off + len,
427 				test_buf_size, src_off + len,
428 				PATTERN_SRC, true);
429 
430 		pr_debug("%s: verifying dest buffer...\n",
431 				thread->task->comm);
432 		error_count += dmatest_verify(thread->dsts, 0, dst_off,
433 				0, PATTERN_DST, false);
434 		error_count += dmatest_verify(thread->dsts, dst_off,
435 				dst_off + len, src_off,
436 				PATTERN_SRC | PATTERN_COPY, false);
437 		error_count += dmatest_verify(thread->dsts, dst_off + len,
438 				test_buf_size, dst_off + len,
439 				PATTERN_DST, false);
440 
441 		if (error_count) {
442 			pr_warning("%s: #%u: %u errors with "
443 				"src_off=0x%x dst_off=0x%x len=0x%x\n",
444 				thread_name, total_tests - 1, error_count,
445 				src_off, dst_off, len);
446 			failed_tests++;
447 		} else {
448 			pr_debug("%s: #%u: No errors with "
449 				"src_off=0x%x dst_off=0x%x len=0x%x\n",
450 				thread_name, total_tests - 1,
451 				src_off, dst_off, len);
452 		}
453 	}
454 
455 	ret = 0;
456 	for (i = 0; thread->dsts[i]; i++)
457 		kfree(thread->dsts[i]);
458 err_dstbuf:
459 	kfree(thread->dsts);
460 err_dsts:
461 	for (i = 0; thread->srcs[i]; i++)
462 		kfree(thread->srcs[i]);
463 err_srcbuf:
464 	kfree(thread->srcs);
465 err_srcs:
466 	pr_notice("%s: terminating after %u tests, %u failures (status %d)\n",
467 			thread_name, total_tests, failed_tests, ret);
468 
469 	if (iterations > 0)
470 		while (!kthread_should_stop()) {
471 			DECLARE_WAIT_QUEUE_HEAD_ONSTACK(wait_dmatest_exit);
472 			interruptible_sleep_on(&wait_dmatest_exit);
473 		}
474 
475 	return ret;
476 }
477 
478 static void dmatest_cleanup_channel(struct dmatest_chan *dtc)
479 {
480 	struct dmatest_thread	*thread;
481 	struct dmatest_thread	*_thread;
482 	int			ret;
483 
484 	list_for_each_entry_safe(thread, _thread, &dtc->threads, node) {
485 		ret = kthread_stop(thread->task);
486 		pr_debug("dmatest: thread %s exited with status %d\n",
487 				thread->task->comm, ret);
488 		list_del(&thread->node);
489 		kfree(thread);
490 	}
491 	kfree(dtc);
492 }
493 
494 static int dmatest_add_threads(struct dmatest_chan *dtc, enum dma_transaction_type type)
495 {
496 	struct dmatest_thread *thread;
497 	struct dma_chan *chan = dtc->chan;
498 	char *op;
499 	unsigned int i;
500 
501 	if (type == DMA_MEMCPY)
502 		op = "copy";
503 	else if (type == DMA_XOR)
504 		op = "xor";
505 	else if (type == DMA_PQ)
506 		op = "pq";
507 	else
508 		return -EINVAL;
509 
510 	for (i = 0; i < threads_per_chan; i++) {
511 		thread = kzalloc(sizeof(struct dmatest_thread), GFP_KERNEL);
512 		if (!thread) {
513 			pr_warning("dmatest: No memory for %s-%s%u\n",
514 				   dma_chan_name(chan), op, i);
515 
516 			break;
517 		}
518 		thread->chan = dtc->chan;
519 		thread->type = type;
520 		smp_wmb();
521 		thread->task = kthread_run(dmatest_func, thread, "%s-%s%u",
522 				dma_chan_name(chan), op, i);
523 		if (IS_ERR(thread->task)) {
524 			pr_warning("dmatest: Failed to run thread %s-%s%u\n",
525 					dma_chan_name(chan), op, i);
526 			kfree(thread);
527 			break;
528 		}
529 
530 		/* srcbuf and dstbuf are allocated by the thread itself */
531 
532 		list_add_tail(&thread->node, &dtc->threads);
533 	}
534 
535 	return i;
536 }
537 
538 static int dmatest_add_channel(struct dma_chan *chan)
539 {
540 	struct dmatest_chan	*dtc;
541 	struct dma_device	*dma_dev = chan->device;
542 	unsigned int		thread_count = 0;
543 	int cnt;
544 
545 	dtc = kmalloc(sizeof(struct dmatest_chan), GFP_KERNEL);
546 	if (!dtc) {
547 		pr_warning("dmatest: No memory for %s\n", dma_chan_name(chan));
548 		return -ENOMEM;
549 	}
550 
551 	dtc->chan = chan;
552 	INIT_LIST_HEAD(&dtc->threads);
553 
554 	if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask)) {
555 		cnt = dmatest_add_threads(dtc, DMA_MEMCPY);
556 		thread_count += cnt > 0 ? cnt : 0;
557 	}
558 	if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
559 		cnt = dmatest_add_threads(dtc, DMA_XOR);
560 		thread_count += cnt > 0 ? cnt : 0;
561 	}
562 	if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
563 		cnt = dmatest_add_threads(dtc, DMA_PQ);
564 		thread_count += cnt > 0 ?: 0;
565 	}
566 
567 	pr_info("dmatest: Started %u threads using %s\n",
568 		thread_count, dma_chan_name(chan));
569 
570 	list_add_tail(&dtc->node, &dmatest_channels);
571 	nr_channels++;
572 
573 	return 0;
574 }
575 
576 static bool filter(struct dma_chan *chan, void *param)
577 {
578 	if (!dmatest_match_channel(chan) || !dmatest_match_device(chan->device))
579 		return false;
580 	else
581 		return true;
582 }
583 
584 static int __init dmatest_init(void)
585 {
586 	dma_cap_mask_t mask;
587 	struct dma_chan *chan;
588 	int err = 0;
589 
590 	dma_cap_zero(mask);
591 	dma_cap_set(DMA_MEMCPY, mask);
592 	for (;;) {
593 		chan = dma_request_channel(mask, filter, NULL);
594 		if (chan) {
595 			err = dmatest_add_channel(chan);
596 			if (err) {
597 				dma_release_channel(chan);
598 				break; /* add_channel failed, punt */
599 			}
600 		} else
601 			break; /* no more channels available */
602 		if (max_channels && nr_channels >= max_channels)
603 			break; /* we have all we need */
604 	}
605 
606 	return err;
607 }
608 /* when compiled-in wait for drivers to load first */
609 late_initcall(dmatest_init);
610 
611 static void __exit dmatest_exit(void)
612 {
613 	struct dmatest_chan *dtc, *_dtc;
614 	struct dma_chan *chan;
615 
616 	list_for_each_entry_safe(dtc, _dtc, &dmatest_channels, node) {
617 		list_del(&dtc->node);
618 		chan = dtc->chan;
619 		dmatest_cleanup_channel(dtc);
620 		pr_debug("dmatest: dropped channel %s\n",
621 			 dma_chan_name(chan));
622 		dma_release_channel(chan);
623 	}
624 }
625 module_exit(dmatest_exit);
626 
627 MODULE_AUTHOR("Haavard Skinnemoen <hskinnemoen@atmel.com>");
628 MODULE_LICENSE("GPL v2");
629