Loading...
1// SPDX-License-Identifier: GPL-2.0-only
2/*
3 * DMA Engine test module
4 *
5 * Copyright (C) 2007 Atmel Corporation
6 * Copyright (C) 2013 Intel Corporation
7 */
8#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
9
10#include <linux/delay.h>
11#include <linux/dma-mapping.h>
12#include <linux/dmaengine.h>
13#include <linux/freezer.h>
14#include <linux/init.h>
15#include <linux/kthread.h>
16#include <linux/sched/task.h>
17#include <linux/module.h>
18#include <linux/moduleparam.h>
19#include <linux/random.h>
20#include <linux/slab.h>
21#include <linux/wait.h>
22
23static unsigned int test_buf_size = 16384;
24module_param(test_buf_size, uint, S_IRUGO | S_IWUSR);
25MODULE_PARM_DESC(test_buf_size, "Size of the memcpy test buffer");
26
27static char test_device[32];
28module_param_string(device, test_device, sizeof(test_device),
29 S_IRUGO | S_IWUSR);
30MODULE_PARM_DESC(device, "Bus ID of the DMA Engine to test (default: any)");
31
32static unsigned int threads_per_chan = 1;
33module_param(threads_per_chan, uint, S_IRUGO | S_IWUSR);
34MODULE_PARM_DESC(threads_per_chan,
35 "Number of threads to start per channel (default: 1)");
36
37static unsigned int max_channels;
38module_param(max_channels, uint, S_IRUGO | S_IWUSR);
39MODULE_PARM_DESC(max_channels,
40 "Maximum number of channels to use (default: all)");
41
42static unsigned int iterations;
43module_param(iterations, uint, S_IRUGO | S_IWUSR);
44MODULE_PARM_DESC(iterations,
45 "Iterations before stopping test (default: infinite)");
46
47static unsigned int dmatest;
48module_param(dmatest, uint, S_IRUGO | S_IWUSR);
49MODULE_PARM_DESC(dmatest,
50 "dmatest 0-memcpy 1-memset (default: 0)");
51
52static unsigned int xor_sources = 3;
53module_param(xor_sources, uint, S_IRUGO | S_IWUSR);
54MODULE_PARM_DESC(xor_sources,
55 "Number of xor source buffers (default: 3)");
56
57static unsigned int pq_sources = 3;
58module_param(pq_sources, uint, S_IRUGO | S_IWUSR);
59MODULE_PARM_DESC(pq_sources,
60 "Number of p+q source buffers (default: 3)");
61
62static int timeout = 3000;
63module_param(timeout, int, S_IRUGO | S_IWUSR);
64MODULE_PARM_DESC(timeout, "Transfer Timeout in msec (default: 3000), "
65 "Pass -1 for infinite timeout");
66
67static bool noverify;
68module_param(noverify, bool, S_IRUGO | S_IWUSR);
69MODULE_PARM_DESC(noverify, "Disable data verification (default: verify)");
70
71static bool norandom;
72module_param(norandom, bool, 0644);
73MODULE_PARM_DESC(norandom, "Disable random offset setup (default: random)");
74
75static bool verbose;
76module_param(verbose, bool, S_IRUGO | S_IWUSR);
77MODULE_PARM_DESC(verbose, "Enable \"success\" result messages (default: off)");
78
79static int alignment = -1;
80module_param(alignment, int, 0644);
81MODULE_PARM_DESC(alignment, "Custom data address alignment taken as 2^(alignment) (default: not used (-1))");
82
83static unsigned int transfer_size;
84module_param(transfer_size, uint, 0644);
85MODULE_PARM_DESC(transfer_size, "Optional custom transfer size in bytes (default: not used (0))");
86
87static bool polled;
88module_param(polled, bool, S_IRUGO | S_IWUSR);
89MODULE_PARM_DESC(polled, "Use polling for completion instead of interrupts");
90
91/**
92 * struct dmatest_params - test parameters.
93 * @buf_size: size of the memcpy test buffer
94 * @channel: bus ID of the channel to test
95 * @device: bus ID of the DMA Engine to test
96 * @threads_per_chan: number of threads to start per channel
97 * @max_channels: maximum number of channels to use
98 * @iterations: iterations before stopping test
99 * @xor_sources: number of xor source buffers
100 * @pq_sources: number of p+q source buffers
101 * @timeout: transfer timeout in msec, -1 for infinite timeout
102 * @noverify: disable data verification
103 * @norandom: disable random offset setup
104 * @alignment: custom data address alignment taken as 2^alignment
105 * @transfer_size: custom transfer size in bytes
106 * @polled: use polling for completion instead of interrupts
107 */
108struct dmatest_params {
109 unsigned int buf_size;
110 char channel[20];
111 char device[32];
112 unsigned int threads_per_chan;
113 unsigned int max_channels;
114 unsigned int iterations;
115 unsigned int xor_sources;
116 unsigned int pq_sources;
117 int timeout;
118 bool noverify;
119 bool norandom;
120 int alignment;
121 unsigned int transfer_size;
122 bool polled;
123};
124
125/**
126 * struct dmatest_info - test information.
127 * @params: test parameters
128 * @channels: channels under test
129 * @nr_channels: number of channels under test
130 * @lock: access protection to the fields of this structure
131 * @did_init: module has been initialized completely
132 * @last_error: test has faced configuration issues
133 */
134static struct dmatest_info {
135 /* Test parameters */
136 struct dmatest_params params;
137
138 /* Internal state */
139 struct list_head channels;
140 unsigned int nr_channels;
141 int last_error;
142 struct mutex lock;
143 bool did_init;
144} test_info = {
145 .channels = LIST_HEAD_INIT(test_info.channels),
146 .lock = __MUTEX_INITIALIZER(test_info.lock),
147};
148
149static int dmatest_run_set(const char *val, const struct kernel_param *kp);
150static int dmatest_run_get(char *val, const struct kernel_param *kp);
151static const struct kernel_param_ops run_ops = {
152 .set = dmatest_run_set,
153 .get = dmatest_run_get,
154};
155static bool dmatest_run;
156module_param_cb(run, &run_ops, &dmatest_run, S_IRUGO | S_IWUSR);
157MODULE_PARM_DESC(run, "Run the test (default: false)");
158
159static int dmatest_chan_set(const char *val, const struct kernel_param *kp);
160static int dmatest_chan_get(char *val, const struct kernel_param *kp);
161static const struct kernel_param_ops multi_chan_ops = {
162 .set = dmatest_chan_set,
163 .get = dmatest_chan_get,
164};
165
166static char test_channel[20];
167static struct kparam_string newchan_kps = {
168 .string = test_channel,
169 .maxlen = 20,
170};
171module_param_cb(channel, &multi_chan_ops, &newchan_kps, 0644);
172MODULE_PARM_DESC(channel, "Bus ID of the channel to test (default: any)");
173
174static int dmatest_test_list_get(char *val, const struct kernel_param *kp);
175static const struct kernel_param_ops test_list_ops = {
176 .get = dmatest_test_list_get,
177};
178module_param_cb(test_list, &test_list_ops, NULL, 0444);
179MODULE_PARM_DESC(test_list, "Print current test list");
180
181/* Maximum amount of mismatched bytes in buffer to print */
182#define MAX_ERROR_COUNT 32
183
184/*
185 * Initialization patterns. All bytes in the source buffer has bit 7
186 * set, all bytes in the destination buffer has bit 7 cleared.
187 *
188 * Bit 6 is set for all bytes which are to be copied by the DMA
189 * engine. Bit 5 is set for all bytes which are to be overwritten by
190 * the DMA engine.
191 *
192 * The remaining bits are the inverse of a counter which increments by
193 * one for each byte address.
194 */
195#define PATTERN_SRC 0x80
196#define PATTERN_DST 0x00
197#define PATTERN_COPY 0x40
198#define PATTERN_OVERWRITE 0x20
199#define PATTERN_COUNT_MASK 0x1f
200#define PATTERN_MEMSET_IDX 0x01
201
202/* Fixed point arithmetic ops */
203#define FIXPT_SHIFT 8
204#define FIXPNT_MASK 0xFF
205#define FIXPT_TO_INT(a) ((a) >> FIXPT_SHIFT)
206#define INT_TO_FIXPT(a) ((a) << FIXPT_SHIFT)
207#define FIXPT_GET_FRAC(a) ((((a) & FIXPNT_MASK) * 100) >> FIXPT_SHIFT)
208
209/* poor man's completion - we want to use wait_event_freezable() on it */
210struct dmatest_done {
211 bool done;
212 wait_queue_head_t *wait;
213};
214
215struct dmatest_data {
216 u8 **raw;
217 u8 **aligned;
218 unsigned int cnt;
219 unsigned int off;
220};
221
222struct dmatest_thread {
223 struct list_head node;
224 struct dmatest_info *info;
225 struct task_struct *task;
226 struct dma_chan *chan;
227 struct dmatest_data src;
228 struct dmatest_data dst;
229 enum dma_transaction_type type;
230 wait_queue_head_t done_wait;
231 struct dmatest_done test_done;
232 bool done;
233 bool pending;
234};
235
236struct dmatest_chan {
237 struct list_head node;
238 struct dma_chan *chan;
239 struct list_head threads;
240};
241
242static DECLARE_WAIT_QUEUE_HEAD(thread_wait);
243static bool wait;
244
245static bool is_threaded_test_run(struct dmatest_info *info)
246{
247 struct dmatest_chan *dtc;
248
249 list_for_each_entry(dtc, &info->channels, node) {
250 struct dmatest_thread *thread;
251
252 list_for_each_entry(thread, &dtc->threads, node) {
253 if (!thread->done && !thread->pending)
254 return true;
255 }
256 }
257
258 return false;
259}
260
261static bool is_threaded_test_pending(struct dmatest_info *info)
262{
263 struct dmatest_chan *dtc;
264
265 list_for_each_entry(dtc, &info->channels, node) {
266 struct dmatest_thread *thread;
267
268 list_for_each_entry(thread, &dtc->threads, node) {
269 if (thread->pending)
270 return true;
271 }
272 }
273
274 return false;
275}
276
277static int dmatest_wait_get(char *val, const struct kernel_param *kp)
278{
279 struct dmatest_info *info = &test_info;
280 struct dmatest_params *params = &info->params;
281
282 if (params->iterations)
283 wait_event(thread_wait, !is_threaded_test_run(info));
284 wait = true;
285 return param_get_bool(val, kp);
286}
287
288static const struct kernel_param_ops wait_ops = {
289 .get = dmatest_wait_get,
290 .set = param_set_bool,
291};
292module_param_cb(wait, &wait_ops, &wait, S_IRUGO);
293MODULE_PARM_DESC(wait, "Wait for tests to complete (default: false)");
294
295static bool dmatest_match_channel(struct dmatest_params *params,
296 struct dma_chan *chan)
297{
298 if (params->channel[0] == '\0')
299 return true;
300 return strcmp(dma_chan_name(chan), params->channel) == 0;
301}
302
303static bool dmatest_match_device(struct dmatest_params *params,
304 struct dma_device *device)
305{
306 if (params->device[0] == '\0')
307 return true;
308 return strcmp(dev_name(device->dev), params->device) == 0;
309}
310
311static unsigned long dmatest_random(void)
312{
313 unsigned long buf;
314
315 prandom_bytes(&buf, sizeof(buf));
316 return buf;
317}
318
319static inline u8 gen_inv_idx(u8 index, bool is_memset)
320{
321 u8 val = is_memset ? PATTERN_MEMSET_IDX : index;
322
323 return ~val & PATTERN_COUNT_MASK;
324}
325
326static inline u8 gen_src_value(u8 index, bool is_memset)
327{
328 return PATTERN_SRC | gen_inv_idx(index, is_memset);
329}
330
331static inline u8 gen_dst_value(u8 index, bool is_memset)
332{
333 return PATTERN_DST | gen_inv_idx(index, is_memset);
334}
335
336static void dmatest_init_srcs(u8 **bufs, unsigned int start, unsigned int len,
337 unsigned int buf_size, bool is_memset)
338{
339 unsigned int i;
340 u8 *buf;
341
342 for (; (buf = *bufs); bufs++) {
343 for (i = 0; i < start; i++)
344 buf[i] = gen_src_value(i, is_memset);
345 for ( ; i < start + len; i++)
346 buf[i] = gen_src_value(i, is_memset) | PATTERN_COPY;
347 for ( ; i < buf_size; i++)
348 buf[i] = gen_src_value(i, is_memset);
349 buf++;
350 }
351}
352
353static void dmatest_init_dsts(u8 **bufs, unsigned int start, unsigned int len,
354 unsigned int buf_size, bool is_memset)
355{
356 unsigned int i;
357 u8 *buf;
358
359 for (; (buf = *bufs); bufs++) {
360 for (i = 0; i < start; i++)
361 buf[i] = gen_dst_value(i, is_memset);
362 for ( ; i < start + len; i++)
363 buf[i] = gen_dst_value(i, is_memset) |
364 PATTERN_OVERWRITE;
365 for ( ; i < buf_size; i++)
366 buf[i] = gen_dst_value(i, is_memset);
367 }
368}
369
370static void dmatest_mismatch(u8 actual, u8 pattern, unsigned int index,
371 unsigned int counter, bool is_srcbuf, bool is_memset)
372{
373 u8 diff = actual ^ pattern;
374 u8 expected = pattern | gen_inv_idx(counter, is_memset);
375 const char *thread_name = current->comm;
376
377 if (is_srcbuf)
378 pr_warn("%s: srcbuf[0x%x] overwritten! Expected %02x, got %02x\n",
379 thread_name, index, expected, actual);
380 else if ((pattern & PATTERN_COPY)
381 && (diff & (PATTERN_COPY | PATTERN_OVERWRITE)))
382 pr_warn("%s: dstbuf[0x%x] not copied! Expected %02x, got %02x\n",
383 thread_name, index, expected, actual);
384 else if (diff & PATTERN_SRC)
385 pr_warn("%s: dstbuf[0x%x] was copied! Expected %02x, got %02x\n",
386 thread_name, index, expected, actual);
387 else
388 pr_warn("%s: dstbuf[0x%x] mismatch! Expected %02x, got %02x\n",
389 thread_name, index, expected, actual);
390}
391
392static unsigned int dmatest_verify(u8 **bufs, unsigned int start,
393 unsigned int end, unsigned int counter, u8 pattern,
394 bool is_srcbuf, bool is_memset)
395{
396 unsigned int i;
397 unsigned int error_count = 0;
398 u8 actual;
399 u8 expected;
400 u8 *buf;
401 unsigned int counter_orig = counter;
402
403 for (; (buf = *bufs); bufs++) {
404 counter = counter_orig;
405 for (i = start; i < end; i++) {
406 actual = buf[i];
407 expected = pattern | gen_inv_idx(counter, is_memset);
408 if (actual != expected) {
409 if (error_count < MAX_ERROR_COUNT)
410 dmatest_mismatch(actual, pattern, i,
411 counter, is_srcbuf,
412 is_memset);
413 error_count++;
414 }
415 counter++;
416 }
417 }
418
419 if (error_count > MAX_ERROR_COUNT)
420 pr_warn("%s: %u errors suppressed\n",
421 current->comm, error_count - MAX_ERROR_COUNT);
422
423 return error_count;
424}
425
426
427static void dmatest_callback(void *arg)
428{
429 struct dmatest_done *done = arg;
430 struct dmatest_thread *thread =
431 container_of(done, struct dmatest_thread, test_done);
432 if (!thread->done) {
433 done->done = true;
434 wake_up_all(done->wait);
435 } else {
436 /*
437 * If thread->done, it means that this callback occurred
438 * after the parent thread has cleaned up. This can
439 * happen in the case that driver doesn't implement
440 * the terminate_all() functionality and a dma operation
441 * did not occur within the timeout period
442 */
443 WARN(1, "dmatest: Kernel memory may be corrupted!!\n");
444 }
445}
446
447static unsigned int min_odd(unsigned int x, unsigned int y)
448{
449 unsigned int val = min(x, y);
450
451 return val % 2 ? val : val - 1;
452}
453
454static void result(const char *err, unsigned int n, unsigned int src_off,
455 unsigned int dst_off, unsigned int len, unsigned long data)
456{
457 pr_info("%s: result #%u: '%s' with src_off=0x%x dst_off=0x%x len=0x%x (%lu)\n",
458 current->comm, n, err, src_off, dst_off, len, data);
459}
460
461static void dbg_result(const char *err, unsigned int n, unsigned int src_off,
462 unsigned int dst_off, unsigned int len,
463 unsigned long data)
464{
465 pr_debug("%s: result #%u: '%s' with src_off=0x%x dst_off=0x%x len=0x%x (%lu)\n",
466 current->comm, n, err, src_off, dst_off, len, data);
467}
468
469#define verbose_result(err, n, src_off, dst_off, len, data) ({ \
470 if (verbose) \
471 result(err, n, src_off, dst_off, len, data); \
472 else \
473 dbg_result(err, n, src_off, dst_off, len, data);\
474})
475
476static unsigned long long dmatest_persec(s64 runtime, unsigned int val)
477{
478 unsigned long long per_sec = 1000000;
479
480 if (runtime <= 0)
481 return 0;
482
483 /* drop precision until runtime is 32-bits */
484 while (runtime > UINT_MAX) {
485 runtime >>= 1;
486 per_sec <<= 1;
487 }
488
489 per_sec *= val;
490 per_sec = INT_TO_FIXPT(per_sec);
491 do_div(per_sec, runtime);
492
493 return per_sec;
494}
495
496static unsigned long long dmatest_KBs(s64 runtime, unsigned long long len)
497{
498 return FIXPT_TO_INT(dmatest_persec(runtime, len >> 10));
499}
500
501static void __dmatest_free_test_data(struct dmatest_data *d, unsigned int cnt)
502{
503 unsigned int i;
504
505 for (i = 0; i < cnt; i++)
506 kfree(d->raw[i]);
507
508 kfree(d->aligned);
509 kfree(d->raw);
510}
511
512static void dmatest_free_test_data(struct dmatest_data *d)
513{
514 __dmatest_free_test_data(d, d->cnt);
515}
516
517static int dmatest_alloc_test_data(struct dmatest_data *d,
518 unsigned int buf_size, u8 align)
519{
520 unsigned int i = 0;
521
522 d->raw = kcalloc(d->cnt + 1, sizeof(u8 *), GFP_KERNEL);
523 if (!d->raw)
524 return -ENOMEM;
525
526 d->aligned = kcalloc(d->cnt + 1, sizeof(u8 *), GFP_KERNEL);
527 if (!d->aligned)
528 goto err;
529
530 for (i = 0; i < d->cnt; i++) {
531 d->raw[i] = kmalloc(buf_size + align, GFP_KERNEL);
532 if (!d->raw[i])
533 goto err;
534
535 /* align to alignment restriction */
536 if (align)
537 d->aligned[i] = PTR_ALIGN(d->raw[i], align);
538 else
539 d->aligned[i] = d->raw[i];
540 }
541
542 return 0;
543err:
544 __dmatest_free_test_data(d, i);
545 return -ENOMEM;
546}
547
548/*
549 * This function repeatedly tests DMA transfers of various lengths and
550 * offsets for a given operation type until it is told to exit by
551 * kthread_stop(). There may be multiple threads running this function
552 * in parallel for a single channel, and there may be multiple channels
553 * being tested in parallel.
554 *
555 * Before each test, the source and destination buffer is initialized
556 * with a known pattern. This pattern is different depending on
557 * whether it's in an area which is supposed to be copied or
558 * overwritten, and different in the source and destination buffers.
559 * So if the DMA engine doesn't copy exactly what we tell it to copy,
560 * we'll notice.
561 */
562static int dmatest_func(void *data)
563{
564 struct dmatest_thread *thread = data;
565 struct dmatest_done *done = &thread->test_done;
566 struct dmatest_info *info;
567 struct dmatest_params *params;
568 struct dma_chan *chan;
569 struct dma_device *dev;
570 unsigned int error_count;
571 unsigned int failed_tests = 0;
572 unsigned int total_tests = 0;
573 dma_cookie_t cookie;
574 enum dma_status status;
575 enum dma_ctrl_flags flags;
576 u8 *pq_coefs = NULL;
577 int ret;
578 unsigned int buf_size;
579 struct dmatest_data *src;
580 struct dmatest_data *dst;
581 int i;
582 ktime_t ktime, start, diff;
583 ktime_t filltime = 0;
584 ktime_t comparetime = 0;
585 s64 runtime = 0;
586 unsigned long long total_len = 0;
587 unsigned long long iops = 0;
588 u8 align = 0;
589 bool is_memset = false;
590 dma_addr_t *srcs;
591 dma_addr_t *dma_pq;
592
593 set_freezable();
594
595 ret = -ENOMEM;
596
597 smp_rmb();
598 thread->pending = false;
599 info = thread->info;
600 params = &info->params;
601 chan = thread->chan;
602 dev = chan->device;
603 src = &thread->src;
604 dst = &thread->dst;
605 if (thread->type == DMA_MEMCPY) {
606 align = params->alignment < 0 ? dev->copy_align :
607 params->alignment;
608 src->cnt = dst->cnt = 1;
609 } else if (thread->type == DMA_MEMSET) {
610 align = params->alignment < 0 ? dev->fill_align :
611 params->alignment;
612 src->cnt = dst->cnt = 1;
613 is_memset = true;
614 } else if (thread->type == DMA_XOR) {
615 /* force odd to ensure dst = src */
616 src->cnt = min_odd(params->xor_sources | 1, dev->max_xor);
617 dst->cnt = 1;
618 align = params->alignment < 0 ? dev->xor_align :
619 params->alignment;
620 } else if (thread->type == DMA_PQ) {
621 /* force odd to ensure dst = src */
622 src->cnt = min_odd(params->pq_sources | 1, dma_maxpq(dev, 0));
623 dst->cnt = 2;
624 align = params->alignment < 0 ? dev->pq_align :
625 params->alignment;
626
627 pq_coefs = kmalloc(params->pq_sources + 1, GFP_KERNEL);
628 if (!pq_coefs)
629 goto err_thread_type;
630
631 for (i = 0; i < src->cnt; i++)
632 pq_coefs[i] = 1;
633 } else
634 goto err_thread_type;
635
636 /* Check if buffer count fits into map count variable (u8) */
637 if ((src->cnt + dst->cnt) >= 255) {
638 pr_err("too many buffers (%d of 255 supported)\n",
639 src->cnt + dst->cnt);
640 goto err_free_coefs;
641 }
642
643 buf_size = params->buf_size;
644 if (1 << align > buf_size) {
645 pr_err("%u-byte buffer too small for %d-byte alignment\n",
646 buf_size, 1 << align);
647 goto err_free_coefs;
648 }
649
650 if (dmatest_alloc_test_data(src, buf_size, align) < 0)
651 goto err_free_coefs;
652
653 if (dmatest_alloc_test_data(dst, buf_size, align) < 0)
654 goto err_src;
655
656 set_user_nice(current, 10);
657
658 srcs = kcalloc(src->cnt, sizeof(dma_addr_t), GFP_KERNEL);
659 if (!srcs)
660 goto err_dst;
661
662 dma_pq = kcalloc(dst->cnt, sizeof(dma_addr_t), GFP_KERNEL);
663 if (!dma_pq)
664 goto err_srcs_array;
665
666 /*
667 * src and dst buffers are freed by ourselves below
668 */
669 if (params->polled)
670 flags = DMA_CTRL_ACK;
671 else
672 flags = DMA_CTRL_ACK | DMA_PREP_INTERRUPT;
673
674 ktime = ktime_get();
675 while (!(kthread_should_stop() ||
676 (params->iterations && total_tests >= params->iterations))) {
677 struct dma_async_tx_descriptor *tx = NULL;
678 struct dmaengine_unmap_data *um;
679 dma_addr_t *dsts;
680 unsigned int len;
681
682 total_tests++;
683
684 if (params->transfer_size) {
685 if (params->transfer_size >= buf_size) {
686 pr_err("%u-byte transfer size must be lower than %u-buffer size\n",
687 params->transfer_size, buf_size);
688 break;
689 }
690 len = params->transfer_size;
691 } else if (params->norandom) {
692 len = buf_size;
693 } else {
694 len = dmatest_random() % buf_size + 1;
695 }
696
697 /* Do not alter transfer size explicitly defined by user */
698 if (!params->transfer_size) {
699 len = (len >> align) << align;
700 if (!len)
701 len = 1 << align;
702 }
703 total_len += len;
704
705 if (params->norandom) {
706 src->off = 0;
707 dst->off = 0;
708 } else {
709 src->off = dmatest_random() % (buf_size - len + 1);
710 dst->off = dmatest_random() % (buf_size - len + 1);
711
712 src->off = (src->off >> align) << align;
713 dst->off = (dst->off >> align) << align;
714 }
715
716 if (!params->noverify) {
717 start = ktime_get();
718 dmatest_init_srcs(src->aligned, src->off, len,
719 buf_size, is_memset);
720 dmatest_init_dsts(dst->aligned, dst->off, len,
721 buf_size, is_memset);
722
723 diff = ktime_sub(ktime_get(), start);
724 filltime = ktime_add(filltime, diff);
725 }
726
727 um = dmaengine_get_unmap_data(dev->dev, src->cnt + dst->cnt,
728 GFP_KERNEL);
729 if (!um) {
730 failed_tests++;
731 result("unmap data NULL", total_tests,
732 src->off, dst->off, len, ret);
733 continue;
734 }
735
736 um->len = buf_size;
737 for (i = 0; i < src->cnt; i++) {
738 void *buf = src->aligned[i];
739 struct page *pg = virt_to_page(buf);
740 unsigned long pg_off = offset_in_page(buf);
741
742 um->addr[i] = dma_map_page(dev->dev, pg, pg_off,
743 um->len, DMA_TO_DEVICE);
744 srcs[i] = um->addr[i] + src->off;
745 ret = dma_mapping_error(dev->dev, um->addr[i]);
746 if (ret) {
747 result("src mapping error", total_tests,
748 src->off, dst->off, len, ret);
749 goto error_unmap_continue;
750 }
751 um->to_cnt++;
752 }
753 /* map with DMA_BIDIRECTIONAL to force writeback/invalidate */
754 dsts = &um->addr[src->cnt];
755 for (i = 0; i < dst->cnt; i++) {
756 void *buf = dst->aligned[i];
757 struct page *pg = virt_to_page(buf);
758 unsigned long pg_off = offset_in_page(buf);
759
760 dsts[i] = dma_map_page(dev->dev, pg, pg_off, um->len,
761 DMA_BIDIRECTIONAL);
762 ret = dma_mapping_error(dev->dev, dsts[i]);
763 if (ret) {
764 result("dst mapping error", total_tests,
765 src->off, dst->off, len, ret);
766 goto error_unmap_continue;
767 }
768 um->bidi_cnt++;
769 }
770
771 if (thread->type == DMA_MEMCPY)
772 tx = dev->device_prep_dma_memcpy(chan,
773 dsts[0] + dst->off,
774 srcs[0], len, flags);
775 else if (thread->type == DMA_MEMSET)
776 tx = dev->device_prep_dma_memset(chan,
777 dsts[0] + dst->off,
778 *(src->aligned[0] + src->off),
779 len, flags);
780 else if (thread->type == DMA_XOR)
781 tx = dev->device_prep_dma_xor(chan,
782 dsts[0] + dst->off,
783 srcs, src->cnt,
784 len, flags);
785 else if (thread->type == DMA_PQ) {
786 for (i = 0; i < dst->cnt; i++)
787 dma_pq[i] = dsts[i] + dst->off;
788 tx = dev->device_prep_dma_pq(chan, dma_pq, srcs,
789 src->cnt, pq_coefs,
790 len, flags);
791 }
792
793 if (!tx) {
794 result("prep error", total_tests, src->off,
795 dst->off, len, ret);
796 msleep(100);
797 goto error_unmap_continue;
798 }
799
800 done->done = false;
801 if (!params->polled) {
802 tx->callback = dmatest_callback;
803 tx->callback_param = done;
804 }
805 cookie = tx->tx_submit(tx);
806
807 if (dma_submit_error(cookie)) {
808 result("submit error", total_tests, src->off,
809 dst->off, len, ret);
810 msleep(100);
811 goto error_unmap_continue;
812 }
813
814 if (params->polled) {
815 status = dma_sync_wait(chan, cookie);
816 dmaengine_terminate_sync(chan);
817 if (status == DMA_COMPLETE)
818 done->done = true;
819 } else {
820 dma_async_issue_pending(chan);
821
822 wait_event_freezable_timeout(thread->done_wait,
823 done->done,
824 msecs_to_jiffies(params->timeout));
825
826 status = dma_async_is_tx_complete(chan, cookie, NULL,
827 NULL);
828 }
829
830 if (!done->done) {
831 result("test timed out", total_tests, src->off, dst->off,
832 len, 0);
833 goto error_unmap_continue;
834 } else if (status != DMA_COMPLETE &&
835 !(dma_has_cap(DMA_COMPLETION_NO_ORDER,
836 dev->cap_mask) &&
837 status == DMA_OUT_OF_ORDER)) {
838 result(status == DMA_ERROR ?
839 "completion error status" :
840 "completion busy status", total_tests, src->off,
841 dst->off, len, ret);
842 goto error_unmap_continue;
843 }
844
845 dmaengine_unmap_put(um);
846
847 if (params->noverify) {
848 verbose_result("test passed", total_tests, src->off,
849 dst->off, len, 0);
850 continue;
851 }
852
853 start = ktime_get();
854 pr_debug("%s: verifying source buffer...\n", current->comm);
855 error_count = dmatest_verify(src->aligned, 0, src->off,
856 0, PATTERN_SRC, true, is_memset);
857 error_count += dmatest_verify(src->aligned, src->off,
858 src->off + len, src->off,
859 PATTERN_SRC | PATTERN_COPY, true, is_memset);
860 error_count += dmatest_verify(src->aligned, src->off + len,
861 buf_size, src->off + len,
862 PATTERN_SRC, true, is_memset);
863
864 pr_debug("%s: verifying dest buffer...\n", current->comm);
865 error_count += dmatest_verify(dst->aligned, 0, dst->off,
866 0, PATTERN_DST, false, is_memset);
867
868 error_count += dmatest_verify(dst->aligned, dst->off,
869 dst->off + len, src->off,
870 PATTERN_SRC | PATTERN_COPY, false, is_memset);
871
872 error_count += dmatest_verify(dst->aligned, dst->off + len,
873 buf_size, dst->off + len,
874 PATTERN_DST, false, is_memset);
875
876 diff = ktime_sub(ktime_get(), start);
877 comparetime = ktime_add(comparetime, diff);
878
879 if (error_count) {
880 result("data error", total_tests, src->off, dst->off,
881 len, error_count);
882 failed_tests++;
883 } else {
884 verbose_result("test passed", total_tests, src->off,
885 dst->off, len, 0);
886 }
887
888 continue;
889
890error_unmap_continue:
891 dmaengine_unmap_put(um);
892 failed_tests++;
893 }
894 ktime = ktime_sub(ktime_get(), ktime);
895 ktime = ktime_sub(ktime, comparetime);
896 ktime = ktime_sub(ktime, filltime);
897 runtime = ktime_to_us(ktime);
898
899 ret = 0;
900 kfree(dma_pq);
901err_srcs_array:
902 kfree(srcs);
903err_dst:
904 dmatest_free_test_data(dst);
905err_src:
906 dmatest_free_test_data(src);
907err_free_coefs:
908 kfree(pq_coefs);
909err_thread_type:
910 iops = dmatest_persec(runtime, total_tests);
911 pr_info("%s: summary %u tests, %u failures %llu.%02llu iops %llu KB/s (%d)\n",
912 current->comm, total_tests, failed_tests,
913 FIXPT_TO_INT(iops), FIXPT_GET_FRAC(iops),
914 dmatest_KBs(runtime, total_len), ret);
915
916 /* terminate all transfers on specified channels */
917 if (ret || failed_tests)
918 dmaengine_terminate_sync(chan);
919
920 thread->done = true;
921 wake_up(&thread_wait);
922
923 return ret;
924}
925
926static void dmatest_cleanup_channel(struct dmatest_chan *dtc)
927{
928 struct dmatest_thread *thread;
929 struct dmatest_thread *_thread;
930 int ret;
931
932 list_for_each_entry_safe(thread, _thread, &dtc->threads, node) {
933 ret = kthread_stop(thread->task);
934 pr_debug("thread %s exited with status %d\n",
935 thread->task->comm, ret);
936 list_del(&thread->node);
937 put_task_struct(thread->task);
938 kfree(thread);
939 }
940
941 /* terminate all transfers on specified channels */
942 dmaengine_terminate_sync(dtc->chan);
943
944 kfree(dtc);
945}
946
947static int dmatest_add_threads(struct dmatest_info *info,
948 struct dmatest_chan *dtc, enum dma_transaction_type type)
949{
950 struct dmatest_params *params = &info->params;
951 struct dmatest_thread *thread;
952 struct dma_chan *chan = dtc->chan;
953 char *op;
954 unsigned int i;
955
956 if (type == DMA_MEMCPY)
957 op = "copy";
958 else if (type == DMA_MEMSET)
959 op = "set";
960 else if (type == DMA_XOR)
961 op = "xor";
962 else if (type == DMA_PQ)
963 op = "pq";
964 else
965 return -EINVAL;
966
967 for (i = 0; i < params->threads_per_chan; i++) {
968 thread = kzalloc(sizeof(struct dmatest_thread), GFP_KERNEL);
969 if (!thread) {
970 pr_warn("No memory for %s-%s%u\n",
971 dma_chan_name(chan), op, i);
972 break;
973 }
974 thread->info = info;
975 thread->chan = dtc->chan;
976 thread->type = type;
977 thread->test_done.wait = &thread->done_wait;
978 init_waitqueue_head(&thread->done_wait);
979 smp_wmb();
980 thread->task = kthread_create(dmatest_func, thread, "%s-%s%u",
981 dma_chan_name(chan), op, i);
982 if (IS_ERR(thread->task)) {
983 pr_warn("Failed to create thread %s-%s%u\n",
984 dma_chan_name(chan), op, i);
985 kfree(thread);
986 break;
987 }
988
989 /* srcbuf and dstbuf are allocated by the thread itself */
990 get_task_struct(thread->task);
991 list_add_tail(&thread->node, &dtc->threads);
992 thread->pending = true;
993 }
994
995 return i;
996}
997
998static int dmatest_add_channel(struct dmatest_info *info,
999 struct dma_chan *chan)
1000{
1001 struct dmatest_chan *dtc;
1002 struct dma_device *dma_dev = chan->device;
1003 unsigned int thread_count = 0;
1004 int cnt;
1005
1006 dtc = kmalloc(sizeof(struct dmatest_chan), GFP_KERNEL);
1007 if (!dtc) {
1008 pr_warn("No memory for %s\n", dma_chan_name(chan));
1009 return -ENOMEM;
1010 }
1011
1012 dtc->chan = chan;
1013 INIT_LIST_HEAD(&dtc->threads);
1014
1015 if (dma_has_cap(DMA_COMPLETION_NO_ORDER, dma_dev->cap_mask) &&
1016 info->params.polled) {
1017 info->params.polled = false;
1018 pr_warn("DMA_COMPLETION_NO_ORDER, polled disabled\n");
1019 }
1020
1021 if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask)) {
1022 if (dmatest == 0) {
1023 cnt = dmatest_add_threads(info, dtc, DMA_MEMCPY);
1024 thread_count += cnt > 0 ? cnt : 0;
1025 }
1026 }
1027
1028 if (dma_has_cap(DMA_MEMSET, dma_dev->cap_mask)) {
1029 if (dmatest == 1) {
1030 cnt = dmatest_add_threads(info, dtc, DMA_MEMSET);
1031 thread_count += cnt > 0 ? cnt : 0;
1032 }
1033 }
1034
1035 if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
1036 cnt = dmatest_add_threads(info, dtc, DMA_XOR);
1037 thread_count += cnt > 0 ? cnt : 0;
1038 }
1039 if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
1040 cnt = dmatest_add_threads(info, dtc, DMA_PQ);
1041 thread_count += cnt > 0 ? cnt : 0;
1042 }
1043
1044 pr_info("Added %u threads using %s\n",
1045 thread_count, dma_chan_name(chan));
1046
1047 list_add_tail(&dtc->node, &info->channels);
1048 info->nr_channels++;
1049
1050 return 0;
1051}
1052
1053static bool filter(struct dma_chan *chan, void *param)
1054{
1055 struct dmatest_params *params = param;
1056
1057 if (!dmatest_match_channel(params, chan) ||
1058 !dmatest_match_device(params, chan->device))
1059 return false;
1060 else
1061 return true;
1062}
1063
1064static void request_channels(struct dmatest_info *info,
1065 enum dma_transaction_type type)
1066{
1067 dma_cap_mask_t mask;
1068
1069 dma_cap_zero(mask);
1070 dma_cap_set(type, mask);
1071 for (;;) {
1072 struct dmatest_params *params = &info->params;
1073 struct dma_chan *chan;
1074
1075 chan = dma_request_channel(mask, filter, params);
1076 if (chan) {
1077 if (dmatest_add_channel(info, chan)) {
1078 dma_release_channel(chan);
1079 break; /* add_channel failed, punt */
1080 }
1081 } else
1082 break; /* no more channels available */
1083 if (params->max_channels &&
1084 info->nr_channels >= params->max_channels)
1085 break; /* we have all we need */
1086 }
1087}
1088
1089static void add_threaded_test(struct dmatest_info *info)
1090{
1091 struct dmatest_params *params = &info->params;
1092
1093 /* Copy test parameters */
1094 params->buf_size = test_buf_size;
1095 strlcpy(params->channel, strim(test_channel), sizeof(params->channel));
1096 strlcpy(params->device, strim(test_device), sizeof(params->device));
1097 params->threads_per_chan = threads_per_chan;
1098 params->max_channels = max_channels;
1099 params->iterations = iterations;
1100 params->xor_sources = xor_sources;
1101 params->pq_sources = pq_sources;
1102 params->timeout = timeout;
1103 params->noverify = noverify;
1104 params->norandom = norandom;
1105 params->alignment = alignment;
1106 params->transfer_size = transfer_size;
1107 params->polled = polled;
1108
1109 request_channels(info, DMA_MEMCPY);
1110 request_channels(info, DMA_MEMSET);
1111 request_channels(info, DMA_XOR);
1112 request_channels(info, DMA_PQ);
1113}
1114
1115static void run_pending_tests(struct dmatest_info *info)
1116{
1117 struct dmatest_chan *dtc;
1118 unsigned int thread_count = 0;
1119
1120 list_for_each_entry(dtc, &info->channels, node) {
1121 struct dmatest_thread *thread;
1122
1123 thread_count = 0;
1124 list_for_each_entry(thread, &dtc->threads, node) {
1125 wake_up_process(thread->task);
1126 thread_count++;
1127 }
1128 pr_info("Started %u threads using %s\n",
1129 thread_count, dma_chan_name(dtc->chan));
1130 }
1131}
1132
1133static void stop_threaded_test(struct dmatest_info *info)
1134{
1135 struct dmatest_chan *dtc, *_dtc;
1136 struct dma_chan *chan;
1137
1138 list_for_each_entry_safe(dtc, _dtc, &info->channels, node) {
1139 list_del(&dtc->node);
1140 chan = dtc->chan;
1141 dmatest_cleanup_channel(dtc);
1142 pr_debug("dropped channel %s\n", dma_chan_name(chan));
1143 dma_release_channel(chan);
1144 }
1145
1146 info->nr_channels = 0;
1147}
1148
1149static void start_threaded_tests(struct dmatest_info *info)
1150{
1151 /* we might be called early to set run=, defer running until all
1152 * parameters have been evaluated
1153 */
1154 if (!info->did_init)
1155 return;
1156
1157 run_pending_tests(info);
1158}
1159
1160static int dmatest_run_get(char *val, const struct kernel_param *kp)
1161{
1162 struct dmatest_info *info = &test_info;
1163
1164 mutex_lock(&info->lock);
1165 if (is_threaded_test_run(info)) {
1166 dmatest_run = true;
1167 } else {
1168 if (!is_threaded_test_pending(info))
1169 stop_threaded_test(info);
1170 dmatest_run = false;
1171 }
1172 mutex_unlock(&info->lock);
1173
1174 return param_get_bool(val, kp);
1175}
1176
1177static int dmatest_run_set(const char *val, const struct kernel_param *kp)
1178{
1179 struct dmatest_info *info = &test_info;
1180 int ret;
1181
1182 mutex_lock(&info->lock);
1183 ret = param_set_bool(val, kp);
1184 if (ret) {
1185 mutex_unlock(&info->lock);
1186 return ret;
1187 } else if (dmatest_run) {
1188 if (!is_threaded_test_pending(info)) {
1189 /*
1190 * We have nothing to run. This can be due to:
1191 */
1192 ret = info->last_error;
1193 if (ret) {
1194 /* 1) Misconfiguration */
1195 pr_err("Channel misconfigured, can't continue\n");
1196 mutex_unlock(&info->lock);
1197 return ret;
1198 } else {
1199 /* 2) We rely on defaults */
1200 pr_info("No channels configured, continue with any\n");
1201 if (!is_threaded_test_run(info))
1202 stop_threaded_test(info);
1203 add_threaded_test(info);
1204 }
1205 }
1206 start_threaded_tests(info);
1207 } else {
1208 stop_threaded_test(info);
1209 }
1210
1211 mutex_unlock(&info->lock);
1212
1213 return ret;
1214}
1215
1216static int dmatest_chan_set(const char *val, const struct kernel_param *kp)
1217{
1218 struct dmatest_info *info = &test_info;
1219 struct dmatest_chan *dtc;
1220 char chan_reset_val[20];
1221 int ret;
1222
1223 mutex_lock(&info->lock);
1224 ret = param_set_copystring(val, kp);
1225 if (ret) {
1226 mutex_unlock(&info->lock);
1227 return ret;
1228 }
1229 /*Clear any previously run threads */
1230 if (!is_threaded_test_run(info) && !is_threaded_test_pending(info))
1231 stop_threaded_test(info);
1232 /* Reject channels that are already registered */
1233 if (is_threaded_test_pending(info)) {
1234 list_for_each_entry(dtc, &info->channels, node) {
1235 if (strcmp(dma_chan_name(dtc->chan),
1236 strim(test_channel)) == 0) {
1237 dtc = list_last_entry(&info->channels,
1238 struct dmatest_chan,
1239 node);
1240 strlcpy(chan_reset_val,
1241 dma_chan_name(dtc->chan),
1242 sizeof(chan_reset_val));
1243 ret = -EBUSY;
1244 goto add_chan_err;
1245 }
1246 }
1247 }
1248
1249 add_threaded_test(info);
1250
1251 /* Check if channel was added successfully */
1252 dtc = list_last_entry(&info->channels, struct dmatest_chan, node);
1253
1254 if (dtc->chan) {
1255 /*
1256 * if new channel was not successfully added, revert the
1257 * "test_channel" string to the name of the last successfully
1258 * added channel. exception for when users issues empty string
1259 * to channel parameter.
1260 */
1261 if ((strcmp(dma_chan_name(dtc->chan), strim(test_channel)) != 0)
1262 && (strcmp("", strim(test_channel)) != 0)) {
1263 ret = -EINVAL;
1264 strlcpy(chan_reset_val, dma_chan_name(dtc->chan),
1265 sizeof(chan_reset_val));
1266 goto add_chan_err;
1267 }
1268
1269 } else {
1270 /* Clear test_channel if no channels were added successfully */
1271 strlcpy(chan_reset_val, "", sizeof(chan_reset_val));
1272 ret = -EBUSY;
1273 goto add_chan_err;
1274 }
1275
1276 info->last_error = ret;
1277 mutex_unlock(&info->lock);
1278
1279 return ret;
1280
1281add_chan_err:
1282 param_set_copystring(chan_reset_val, kp);
1283 info->last_error = ret;
1284 mutex_unlock(&info->lock);
1285
1286 return ret;
1287}
1288
1289static int dmatest_chan_get(char *val, const struct kernel_param *kp)
1290{
1291 struct dmatest_info *info = &test_info;
1292
1293 mutex_lock(&info->lock);
1294 if (!is_threaded_test_run(info) && !is_threaded_test_pending(info)) {
1295 stop_threaded_test(info);
1296 strlcpy(test_channel, "", sizeof(test_channel));
1297 }
1298 mutex_unlock(&info->lock);
1299
1300 return param_get_string(val, kp);
1301}
1302
1303static int dmatest_test_list_get(char *val, const struct kernel_param *kp)
1304{
1305 struct dmatest_info *info = &test_info;
1306 struct dmatest_chan *dtc;
1307 unsigned int thread_count = 0;
1308
1309 list_for_each_entry(dtc, &info->channels, node) {
1310 struct dmatest_thread *thread;
1311
1312 thread_count = 0;
1313 list_for_each_entry(thread, &dtc->threads, node) {
1314 thread_count++;
1315 }
1316 pr_info("%u threads using %s\n",
1317 thread_count, dma_chan_name(dtc->chan));
1318 }
1319
1320 return 0;
1321}
1322
1323static int __init dmatest_init(void)
1324{
1325 struct dmatest_info *info = &test_info;
1326 struct dmatest_params *params = &info->params;
1327
1328 if (dmatest_run) {
1329 mutex_lock(&info->lock);
1330 add_threaded_test(info);
1331 run_pending_tests(info);
1332 mutex_unlock(&info->lock);
1333 }
1334
1335 if (params->iterations && wait)
1336 wait_event(thread_wait, !is_threaded_test_run(info));
1337
1338 /* module parameters are stable, inittime tests are started,
1339 * let userspace take over 'run' control
1340 */
1341 info->did_init = true;
1342
1343 return 0;
1344}
1345/* when compiled-in wait for drivers to load first */
1346late_initcall(dmatest_init);
1347
1348static void __exit dmatest_exit(void)
1349{
1350 struct dmatest_info *info = &test_info;
1351
1352 mutex_lock(&info->lock);
1353 stop_threaded_test(info);
1354 mutex_unlock(&info->lock);
1355}
1356module_exit(dmatest_exit);
1357
1358MODULE_AUTHOR("Haavard Skinnemoen (Atmel)");
1359MODULE_LICENSE("GPL v2");
1/*
2 * DMA Engine test module
3 *
4 * Copyright (C) 2007 Atmel Corporation
5 * Copyright (C) 2013 Intel Corporation
6 *
7 * This program is free software; you can redistribute it and/or modify
8 * it under the terms of the GNU General Public License version 2 as
9 * published by the Free Software Foundation.
10 */
11#define pr_fmt(fmt) KBUILD_MODNAME ": " fmt
12
13#include <linux/delay.h>
14#include <linux/dma-mapping.h>
15#include <linux/dmaengine.h>
16#include <linux/freezer.h>
17#include <linux/init.h>
18#include <linux/kthread.h>
19#include <linux/sched/task.h>
20#include <linux/module.h>
21#include <linux/moduleparam.h>
22#include <linux/random.h>
23#include <linux/slab.h>
24#include <linux/wait.h>
25
26static unsigned int test_buf_size = 16384;
27module_param(test_buf_size, uint, S_IRUGO | S_IWUSR);
28MODULE_PARM_DESC(test_buf_size, "Size of the memcpy test buffer");
29
30static char test_channel[20];
31module_param_string(channel, test_channel, sizeof(test_channel),
32 S_IRUGO | S_IWUSR);
33MODULE_PARM_DESC(channel, "Bus ID of the channel to test (default: any)");
34
35static char test_device[32];
36module_param_string(device, test_device, sizeof(test_device),
37 S_IRUGO | S_IWUSR);
38MODULE_PARM_DESC(device, "Bus ID of the DMA Engine to test (default: any)");
39
40static unsigned int threads_per_chan = 1;
41module_param(threads_per_chan, uint, S_IRUGO | S_IWUSR);
42MODULE_PARM_DESC(threads_per_chan,
43 "Number of threads to start per channel (default: 1)");
44
45static unsigned int max_channels;
46module_param(max_channels, uint, S_IRUGO | S_IWUSR);
47MODULE_PARM_DESC(max_channels,
48 "Maximum number of channels to use (default: all)");
49
50static unsigned int iterations;
51module_param(iterations, uint, S_IRUGO | S_IWUSR);
52MODULE_PARM_DESC(iterations,
53 "Iterations before stopping test (default: infinite)");
54
55static unsigned int dmatest;
56module_param(dmatest, uint, S_IRUGO | S_IWUSR);
57MODULE_PARM_DESC(dmatest,
58 "dmatest 0-memcpy 1-memset (default: 0)");
59
60static unsigned int xor_sources = 3;
61module_param(xor_sources, uint, S_IRUGO | S_IWUSR);
62MODULE_PARM_DESC(xor_sources,
63 "Number of xor source buffers (default: 3)");
64
65static unsigned int pq_sources = 3;
66module_param(pq_sources, uint, S_IRUGO | S_IWUSR);
67MODULE_PARM_DESC(pq_sources,
68 "Number of p+q source buffers (default: 3)");
69
70static int timeout = 3000;
71module_param(timeout, uint, S_IRUGO | S_IWUSR);
72MODULE_PARM_DESC(timeout, "Transfer Timeout in msec (default: 3000), "
73 "Pass -1 for infinite timeout");
74
75static bool noverify;
76module_param(noverify, bool, S_IRUGO | S_IWUSR);
77MODULE_PARM_DESC(noverify, "Disable data verification (default: verify)");
78
79static bool norandom;
80module_param(norandom, bool, 0644);
81MODULE_PARM_DESC(norandom, "Disable random offset setup (default: random)");
82
83static bool verbose;
84module_param(verbose, bool, S_IRUGO | S_IWUSR);
85MODULE_PARM_DESC(verbose, "Enable \"success\" result messages (default: off)");
86
87/**
88 * struct dmatest_params - test parameters.
89 * @buf_size: size of the memcpy test buffer
90 * @channel: bus ID of the channel to test
91 * @device: bus ID of the DMA Engine to test
92 * @threads_per_chan: number of threads to start per channel
93 * @max_channels: maximum number of channels to use
94 * @iterations: iterations before stopping test
95 * @xor_sources: number of xor source buffers
96 * @pq_sources: number of p+q source buffers
97 * @timeout: transfer timeout in msec, -1 for infinite timeout
98 */
99struct dmatest_params {
100 unsigned int buf_size;
101 char channel[20];
102 char device[32];
103 unsigned int threads_per_chan;
104 unsigned int max_channels;
105 unsigned int iterations;
106 unsigned int xor_sources;
107 unsigned int pq_sources;
108 int timeout;
109 bool noverify;
110 bool norandom;
111};
112
113/**
114 * struct dmatest_info - test information.
115 * @params: test parameters
116 * @lock: access protection to the fields of this structure
117 */
118static struct dmatest_info {
119 /* Test parameters */
120 struct dmatest_params params;
121
122 /* Internal state */
123 struct list_head channels;
124 unsigned int nr_channels;
125 struct mutex lock;
126 bool did_init;
127} test_info = {
128 .channels = LIST_HEAD_INIT(test_info.channels),
129 .lock = __MUTEX_INITIALIZER(test_info.lock),
130};
131
132static int dmatest_run_set(const char *val, const struct kernel_param *kp);
133static int dmatest_run_get(char *val, const struct kernel_param *kp);
134static const struct kernel_param_ops run_ops = {
135 .set = dmatest_run_set,
136 .get = dmatest_run_get,
137};
138static bool dmatest_run;
139module_param_cb(run, &run_ops, &dmatest_run, S_IRUGO | S_IWUSR);
140MODULE_PARM_DESC(run, "Run the test (default: false)");
141
142/* Maximum amount of mismatched bytes in buffer to print */
143#define MAX_ERROR_COUNT 32
144
145/*
146 * Initialization patterns. All bytes in the source buffer has bit 7
147 * set, all bytes in the destination buffer has bit 7 cleared.
148 *
149 * Bit 6 is set for all bytes which are to be copied by the DMA
150 * engine. Bit 5 is set for all bytes which are to be overwritten by
151 * the DMA engine.
152 *
153 * The remaining bits are the inverse of a counter which increments by
154 * one for each byte address.
155 */
156#define PATTERN_SRC 0x80
157#define PATTERN_DST 0x00
158#define PATTERN_COPY 0x40
159#define PATTERN_OVERWRITE 0x20
160#define PATTERN_COUNT_MASK 0x1f
161#define PATTERN_MEMSET_IDX 0x01
162
163/* poor man's completion - we want to use wait_event_freezable() on it */
164struct dmatest_done {
165 bool done;
166 wait_queue_head_t *wait;
167};
168
169struct dmatest_thread {
170 struct list_head node;
171 struct dmatest_info *info;
172 struct task_struct *task;
173 struct dma_chan *chan;
174 u8 **srcs;
175 u8 **usrcs;
176 u8 **dsts;
177 u8 **udsts;
178 enum dma_transaction_type type;
179 wait_queue_head_t done_wait;
180 struct dmatest_done test_done;
181 bool done;
182};
183
184struct dmatest_chan {
185 struct list_head node;
186 struct dma_chan *chan;
187 struct list_head threads;
188};
189
190static DECLARE_WAIT_QUEUE_HEAD(thread_wait);
191static bool wait;
192
193static bool is_threaded_test_run(struct dmatest_info *info)
194{
195 struct dmatest_chan *dtc;
196
197 list_for_each_entry(dtc, &info->channels, node) {
198 struct dmatest_thread *thread;
199
200 list_for_each_entry(thread, &dtc->threads, node) {
201 if (!thread->done)
202 return true;
203 }
204 }
205
206 return false;
207}
208
209static int dmatest_wait_get(char *val, const struct kernel_param *kp)
210{
211 struct dmatest_info *info = &test_info;
212 struct dmatest_params *params = &info->params;
213
214 if (params->iterations)
215 wait_event(thread_wait, !is_threaded_test_run(info));
216 wait = true;
217 return param_get_bool(val, kp);
218}
219
220static const struct kernel_param_ops wait_ops = {
221 .get = dmatest_wait_get,
222 .set = param_set_bool,
223};
224module_param_cb(wait, &wait_ops, &wait, S_IRUGO);
225MODULE_PARM_DESC(wait, "Wait for tests to complete (default: false)");
226
227static bool dmatest_match_channel(struct dmatest_params *params,
228 struct dma_chan *chan)
229{
230 if (params->channel[0] == '\0')
231 return true;
232 return strcmp(dma_chan_name(chan), params->channel) == 0;
233}
234
235static bool dmatest_match_device(struct dmatest_params *params,
236 struct dma_device *device)
237{
238 if (params->device[0] == '\0')
239 return true;
240 return strcmp(dev_name(device->dev), params->device) == 0;
241}
242
243static unsigned long dmatest_random(void)
244{
245 unsigned long buf;
246
247 prandom_bytes(&buf, sizeof(buf));
248 return buf;
249}
250
251static inline u8 gen_inv_idx(u8 index, bool is_memset)
252{
253 u8 val = is_memset ? PATTERN_MEMSET_IDX : index;
254
255 return ~val & PATTERN_COUNT_MASK;
256}
257
258static inline u8 gen_src_value(u8 index, bool is_memset)
259{
260 return PATTERN_SRC | gen_inv_idx(index, is_memset);
261}
262
263static inline u8 gen_dst_value(u8 index, bool is_memset)
264{
265 return PATTERN_DST | gen_inv_idx(index, is_memset);
266}
267
268static void dmatest_init_srcs(u8 **bufs, unsigned int start, unsigned int len,
269 unsigned int buf_size, bool is_memset)
270{
271 unsigned int i;
272 u8 *buf;
273
274 for (; (buf = *bufs); bufs++) {
275 for (i = 0; i < start; i++)
276 buf[i] = gen_src_value(i, is_memset);
277 for ( ; i < start + len; i++)
278 buf[i] = gen_src_value(i, is_memset) | PATTERN_COPY;
279 for ( ; i < buf_size; i++)
280 buf[i] = gen_src_value(i, is_memset);
281 buf++;
282 }
283}
284
285static void dmatest_init_dsts(u8 **bufs, unsigned int start, unsigned int len,
286 unsigned int buf_size, bool is_memset)
287{
288 unsigned int i;
289 u8 *buf;
290
291 for (; (buf = *bufs); bufs++) {
292 for (i = 0; i < start; i++)
293 buf[i] = gen_dst_value(i, is_memset);
294 for ( ; i < start + len; i++)
295 buf[i] = gen_dst_value(i, is_memset) |
296 PATTERN_OVERWRITE;
297 for ( ; i < buf_size; i++)
298 buf[i] = gen_dst_value(i, is_memset);
299 }
300}
301
302static void dmatest_mismatch(u8 actual, u8 pattern, unsigned int index,
303 unsigned int counter, bool is_srcbuf, bool is_memset)
304{
305 u8 diff = actual ^ pattern;
306 u8 expected = pattern | gen_inv_idx(counter, is_memset);
307 const char *thread_name = current->comm;
308
309 if (is_srcbuf)
310 pr_warn("%s: srcbuf[0x%x] overwritten! Expected %02x, got %02x\n",
311 thread_name, index, expected, actual);
312 else if ((pattern & PATTERN_COPY)
313 && (diff & (PATTERN_COPY | PATTERN_OVERWRITE)))
314 pr_warn("%s: dstbuf[0x%x] not copied! Expected %02x, got %02x\n",
315 thread_name, index, expected, actual);
316 else if (diff & PATTERN_SRC)
317 pr_warn("%s: dstbuf[0x%x] was copied! Expected %02x, got %02x\n",
318 thread_name, index, expected, actual);
319 else
320 pr_warn("%s: dstbuf[0x%x] mismatch! Expected %02x, got %02x\n",
321 thread_name, index, expected, actual);
322}
323
324static unsigned int dmatest_verify(u8 **bufs, unsigned int start,
325 unsigned int end, unsigned int counter, u8 pattern,
326 bool is_srcbuf, bool is_memset)
327{
328 unsigned int i;
329 unsigned int error_count = 0;
330 u8 actual;
331 u8 expected;
332 u8 *buf;
333 unsigned int counter_orig = counter;
334
335 for (; (buf = *bufs); bufs++) {
336 counter = counter_orig;
337 for (i = start; i < end; i++) {
338 actual = buf[i];
339 expected = pattern | gen_inv_idx(counter, is_memset);
340 if (actual != expected) {
341 if (error_count < MAX_ERROR_COUNT)
342 dmatest_mismatch(actual, pattern, i,
343 counter, is_srcbuf,
344 is_memset);
345 error_count++;
346 }
347 counter++;
348 }
349 }
350
351 if (error_count > MAX_ERROR_COUNT)
352 pr_warn("%s: %u errors suppressed\n",
353 current->comm, error_count - MAX_ERROR_COUNT);
354
355 return error_count;
356}
357
358
359static void dmatest_callback(void *arg)
360{
361 struct dmatest_done *done = arg;
362 struct dmatest_thread *thread =
363 container_of(done, struct dmatest_thread, test_done);
364 if (!thread->done) {
365 done->done = true;
366 wake_up_all(done->wait);
367 } else {
368 /*
369 * If thread->done, it means that this callback occurred
370 * after the parent thread has cleaned up. This can
371 * happen in the case that driver doesn't implement
372 * the terminate_all() functionality and a dma operation
373 * did not occur within the timeout period
374 */
375 WARN(1, "dmatest: Kernel memory may be corrupted!!\n");
376 }
377}
378
379static unsigned int min_odd(unsigned int x, unsigned int y)
380{
381 unsigned int val = min(x, y);
382
383 return val % 2 ? val : val - 1;
384}
385
386static void result(const char *err, unsigned int n, unsigned int src_off,
387 unsigned int dst_off, unsigned int len, unsigned long data)
388{
389 pr_info("%s: result #%u: '%s' with src_off=0x%x dst_off=0x%x len=0x%x (%lu)\n",
390 current->comm, n, err, src_off, dst_off, len, data);
391}
392
393static void dbg_result(const char *err, unsigned int n, unsigned int src_off,
394 unsigned int dst_off, unsigned int len,
395 unsigned long data)
396{
397 pr_debug("%s: result #%u: '%s' with src_off=0x%x dst_off=0x%x len=0x%x (%lu)\n",
398 current->comm, n, err, src_off, dst_off, len, data);
399}
400
401#define verbose_result(err, n, src_off, dst_off, len, data) ({ \
402 if (verbose) \
403 result(err, n, src_off, dst_off, len, data); \
404 else \
405 dbg_result(err, n, src_off, dst_off, len, data);\
406})
407
408static unsigned long long dmatest_persec(s64 runtime, unsigned int val)
409{
410 unsigned long long per_sec = 1000000;
411
412 if (runtime <= 0)
413 return 0;
414
415 /* drop precision until runtime is 32-bits */
416 while (runtime > UINT_MAX) {
417 runtime >>= 1;
418 per_sec <<= 1;
419 }
420
421 per_sec *= val;
422 do_div(per_sec, runtime);
423 return per_sec;
424}
425
426static unsigned long long dmatest_KBs(s64 runtime, unsigned long long len)
427{
428 return dmatest_persec(runtime, len >> 10);
429}
430
431/*
432 * This function repeatedly tests DMA transfers of various lengths and
433 * offsets for a given operation type until it is told to exit by
434 * kthread_stop(). There may be multiple threads running this function
435 * in parallel for a single channel, and there may be multiple channels
436 * being tested in parallel.
437 *
438 * Before each test, the source and destination buffer is initialized
439 * with a known pattern. This pattern is different depending on
440 * whether it's in an area which is supposed to be copied or
441 * overwritten, and different in the source and destination buffers.
442 * So if the DMA engine doesn't copy exactly what we tell it to copy,
443 * we'll notice.
444 */
445static int dmatest_func(void *data)
446{
447 struct dmatest_thread *thread = data;
448 struct dmatest_done *done = &thread->test_done;
449 struct dmatest_info *info;
450 struct dmatest_params *params;
451 struct dma_chan *chan;
452 struct dma_device *dev;
453 unsigned int error_count;
454 unsigned int failed_tests = 0;
455 unsigned int total_tests = 0;
456 dma_cookie_t cookie;
457 enum dma_status status;
458 enum dma_ctrl_flags flags;
459 u8 *pq_coefs = NULL;
460 int ret;
461 int src_cnt;
462 int dst_cnt;
463 int i;
464 ktime_t ktime, start, diff;
465 ktime_t filltime = 0;
466 ktime_t comparetime = 0;
467 s64 runtime = 0;
468 unsigned long long total_len = 0;
469 u8 align = 0;
470 bool is_memset = false;
471
472 set_freezable();
473
474 ret = -ENOMEM;
475
476 smp_rmb();
477 info = thread->info;
478 params = &info->params;
479 chan = thread->chan;
480 dev = chan->device;
481 if (thread->type == DMA_MEMCPY) {
482 align = dev->copy_align;
483 src_cnt = dst_cnt = 1;
484 } else if (thread->type == DMA_MEMSET) {
485 align = dev->fill_align;
486 src_cnt = dst_cnt = 1;
487 is_memset = true;
488 } else if (thread->type == DMA_XOR) {
489 /* force odd to ensure dst = src */
490 src_cnt = min_odd(params->xor_sources | 1, dev->max_xor);
491 dst_cnt = 1;
492 align = dev->xor_align;
493 } else if (thread->type == DMA_PQ) {
494 /* force odd to ensure dst = src */
495 src_cnt = min_odd(params->pq_sources | 1, dma_maxpq(dev, 0));
496 dst_cnt = 2;
497 align = dev->pq_align;
498
499 pq_coefs = kmalloc(params->pq_sources + 1, GFP_KERNEL);
500 if (!pq_coefs)
501 goto err_thread_type;
502
503 for (i = 0; i < src_cnt; i++)
504 pq_coefs[i] = 1;
505 } else
506 goto err_thread_type;
507
508 thread->srcs = kcalloc(src_cnt + 1, sizeof(u8 *), GFP_KERNEL);
509 if (!thread->srcs)
510 goto err_srcs;
511
512 thread->usrcs = kcalloc(src_cnt + 1, sizeof(u8 *), GFP_KERNEL);
513 if (!thread->usrcs)
514 goto err_usrcs;
515
516 for (i = 0; i < src_cnt; i++) {
517 thread->usrcs[i] = kmalloc(params->buf_size + align,
518 GFP_KERNEL);
519 if (!thread->usrcs[i])
520 goto err_srcbuf;
521
522 /* align srcs to alignment restriction */
523 if (align)
524 thread->srcs[i] = PTR_ALIGN(thread->usrcs[i], align);
525 else
526 thread->srcs[i] = thread->usrcs[i];
527 }
528 thread->srcs[i] = NULL;
529
530 thread->dsts = kcalloc(dst_cnt + 1, sizeof(u8 *), GFP_KERNEL);
531 if (!thread->dsts)
532 goto err_dsts;
533
534 thread->udsts = kcalloc(dst_cnt + 1, sizeof(u8 *), GFP_KERNEL);
535 if (!thread->udsts)
536 goto err_udsts;
537
538 for (i = 0; i < dst_cnt; i++) {
539 thread->udsts[i] = kmalloc(params->buf_size + align,
540 GFP_KERNEL);
541 if (!thread->udsts[i])
542 goto err_dstbuf;
543
544 /* align dsts to alignment restriction */
545 if (align)
546 thread->dsts[i] = PTR_ALIGN(thread->udsts[i], align);
547 else
548 thread->dsts[i] = thread->udsts[i];
549 }
550 thread->dsts[i] = NULL;
551
552 set_user_nice(current, 10);
553
554 /*
555 * src and dst buffers are freed by ourselves below
556 */
557 flags = DMA_CTRL_ACK | DMA_PREP_INTERRUPT;
558
559 ktime = ktime_get();
560 while (!kthread_should_stop()
561 && !(params->iterations && total_tests >= params->iterations)) {
562 struct dma_async_tx_descriptor *tx = NULL;
563 struct dmaengine_unmap_data *um;
564 dma_addr_t srcs[src_cnt];
565 dma_addr_t *dsts;
566 unsigned int src_off, dst_off, len;
567
568 total_tests++;
569
570 /* Check if buffer count fits into map count variable (u8) */
571 if ((src_cnt + dst_cnt) >= 255) {
572 pr_err("too many buffers (%d of 255 supported)\n",
573 src_cnt + dst_cnt);
574 break;
575 }
576
577 if (1 << align > params->buf_size) {
578 pr_err("%u-byte buffer too small for %d-byte alignment\n",
579 params->buf_size, 1 << align);
580 break;
581 }
582
583 if (params->norandom)
584 len = params->buf_size;
585 else
586 len = dmatest_random() % params->buf_size + 1;
587
588 len = (len >> align) << align;
589 if (!len)
590 len = 1 << align;
591
592 total_len += len;
593
594 if (params->norandom) {
595 src_off = 0;
596 dst_off = 0;
597 } else {
598 src_off = dmatest_random() % (params->buf_size - len + 1);
599 dst_off = dmatest_random() % (params->buf_size - len + 1);
600
601 src_off = (src_off >> align) << align;
602 dst_off = (dst_off >> align) << align;
603 }
604
605 if (!params->noverify) {
606 start = ktime_get();
607 dmatest_init_srcs(thread->srcs, src_off, len,
608 params->buf_size, is_memset);
609 dmatest_init_dsts(thread->dsts, dst_off, len,
610 params->buf_size, is_memset);
611
612 diff = ktime_sub(ktime_get(), start);
613 filltime = ktime_add(filltime, diff);
614 }
615
616 um = dmaengine_get_unmap_data(dev->dev, src_cnt + dst_cnt,
617 GFP_KERNEL);
618 if (!um) {
619 failed_tests++;
620 result("unmap data NULL", total_tests,
621 src_off, dst_off, len, ret);
622 continue;
623 }
624
625 um->len = params->buf_size;
626 for (i = 0; i < src_cnt; i++) {
627 void *buf = thread->srcs[i];
628 struct page *pg = virt_to_page(buf);
629 unsigned long pg_off = offset_in_page(buf);
630
631 um->addr[i] = dma_map_page(dev->dev, pg, pg_off,
632 um->len, DMA_TO_DEVICE);
633 srcs[i] = um->addr[i] + src_off;
634 ret = dma_mapping_error(dev->dev, um->addr[i]);
635 if (ret) {
636 dmaengine_unmap_put(um);
637 result("src mapping error", total_tests,
638 src_off, dst_off, len, ret);
639 failed_tests++;
640 continue;
641 }
642 um->to_cnt++;
643 }
644 /* map with DMA_BIDIRECTIONAL to force writeback/invalidate */
645 dsts = &um->addr[src_cnt];
646 for (i = 0; i < dst_cnt; i++) {
647 void *buf = thread->dsts[i];
648 struct page *pg = virt_to_page(buf);
649 unsigned long pg_off = offset_in_page(buf);
650
651 dsts[i] = dma_map_page(dev->dev, pg, pg_off, um->len,
652 DMA_BIDIRECTIONAL);
653 ret = dma_mapping_error(dev->dev, dsts[i]);
654 if (ret) {
655 dmaengine_unmap_put(um);
656 result("dst mapping error", total_tests,
657 src_off, dst_off, len, ret);
658 failed_tests++;
659 continue;
660 }
661 um->bidi_cnt++;
662 }
663
664 if (thread->type == DMA_MEMCPY)
665 tx = dev->device_prep_dma_memcpy(chan,
666 dsts[0] + dst_off,
667 srcs[0], len, flags);
668 else if (thread->type == DMA_MEMSET)
669 tx = dev->device_prep_dma_memset(chan,
670 dsts[0] + dst_off,
671 *(thread->srcs[0] + src_off),
672 len, flags);
673 else if (thread->type == DMA_XOR)
674 tx = dev->device_prep_dma_xor(chan,
675 dsts[0] + dst_off,
676 srcs, src_cnt,
677 len, flags);
678 else if (thread->type == DMA_PQ) {
679 dma_addr_t dma_pq[dst_cnt];
680
681 for (i = 0; i < dst_cnt; i++)
682 dma_pq[i] = dsts[i] + dst_off;
683 tx = dev->device_prep_dma_pq(chan, dma_pq, srcs,
684 src_cnt, pq_coefs,
685 len, flags);
686 }
687
688 if (!tx) {
689 dmaengine_unmap_put(um);
690 result("prep error", total_tests, src_off,
691 dst_off, len, ret);
692 msleep(100);
693 failed_tests++;
694 continue;
695 }
696
697 done->done = false;
698 tx->callback = dmatest_callback;
699 tx->callback_param = done;
700 cookie = tx->tx_submit(tx);
701
702 if (dma_submit_error(cookie)) {
703 dmaengine_unmap_put(um);
704 result("submit error", total_tests, src_off,
705 dst_off, len, ret);
706 msleep(100);
707 failed_tests++;
708 continue;
709 }
710 dma_async_issue_pending(chan);
711
712 wait_event_freezable_timeout(thread->done_wait, done->done,
713 msecs_to_jiffies(params->timeout));
714
715 status = dma_async_is_tx_complete(chan, cookie, NULL, NULL);
716
717 if (!done->done) {
718 dmaengine_unmap_put(um);
719 result("test timed out", total_tests, src_off, dst_off,
720 len, 0);
721 failed_tests++;
722 continue;
723 } else if (status != DMA_COMPLETE) {
724 dmaengine_unmap_put(um);
725 result(status == DMA_ERROR ?
726 "completion error status" :
727 "completion busy status", total_tests, src_off,
728 dst_off, len, ret);
729 failed_tests++;
730 continue;
731 }
732
733 dmaengine_unmap_put(um);
734
735 if (params->noverify) {
736 verbose_result("test passed", total_tests, src_off,
737 dst_off, len, 0);
738 continue;
739 }
740
741 start = ktime_get();
742 pr_debug("%s: verifying source buffer...\n", current->comm);
743 error_count = dmatest_verify(thread->srcs, 0, src_off,
744 0, PATTERN_SRC, true, is_memset);
745 error_count += dmatest_verify(thread->srcs, src_off,
746 src_off + len, src_off,
747 PATTERN_SRC | PATTERN_COPY, true, is_memset);
748 error_count += dmatest_verify(thread->srcs, src_off + len,
749 params->buf_size, src_off + len,
750 PATTERN_SRC, true, is_memset);
751
752 pr_debug("%s: verifying dest buffer...\n", current->comm);
753 error_count += dmatest_verify(thread->dsts, 0, dst_off,
754 0, PATTERN_DST, false, is_memset);
755
756 error_count += dmatest_verify(thread->dsts, dst_off,
757 dst_off + len, src_off,
758 PATTERN_SRC | PATTERN_COPY, false, is_memset);
759
760 error_count += dmatest_verify(thread->dsts, dst_off + len,
761 params->buf_size, dst_off + len,
762 PATTERN_DST, false, is_memset);
763
764 diff = ktime_sub(ktime_get(), start);
765 comparetime = ktime_add(comparetime, diff);
766
767 if (error_count) {
768 result("data error", total_tests, src_off, dst_off,
769 len, error_count);
770 failed_tests++;
771 } else {
772 verbose_result("test passed", total_tests, src_off,
773 dst_off, len, 0);
774 }
775 }
776 ktime = ktime_sub(ktime_get(), ktime);
777 ktime = ktime_sub(ktime, comparetime);
778 ktime = ktime_sub(ktime, filltime);
779 runtime = ktime_to_us(ktime);
780
781 ret = 0;
782err_dstbuf:
783 for (i = 0; thread->udsts[i]; i++)
784 kfree(thread->udsts[i]);
785 kfree(thread->udsts);
786err_udsts:
787 kfree(thread->dsts);
788err_dsts:
789err_srcbuf:
790 for (i = 0; thread->usrcs[i]; i++)
791 kfree(thread->usrcs[i]);
792 kfree(thread->usrcs);
793err_usrcs:
794 kfree(thread->srcs);
795err_srcs:
796 kfree(pq_coefs);
797err_thread_type:
798 pr_info("%s: summary %u tests, %u failures %llu iops %llu KB/s (%d)\n",
799 current->comm, total_tests, failed_tests,
800 dmatest_persec(runtime, total_tests),
801 dmatest_KBs(runtime, total_len), ret);
802
803 /* terminate all transfers on specified channels */
804 if (ret || failed_tests)
805 dmaengine_terminate_all(chan);
806
807 thread->done = true;
808 wake_up(&thread_wait);
809
810 return ret;
811}
812
813static void dmatest_cleanup_channel(struct dmatest_chan *dtc)
814{
815 struct dmatest_thread *thread;
816 struct dmatest_thread *_thread;
817 int ret;
818
819 list_for_each_entry_safe(thread, _thread, &dtc->threads, node) {
820 ret = kthread_stop(thread->task);
821 pr_debug("thread %s exited with status %d\n",
822 thread->task->comm, ret);
823 list_del(&thread->node);
824 put_task_struct(thread->task);
825 kfree(thread);
826 }
827
828 /* terminate all transfers on specified channels */
829 dmaengine_terminate_all(dtc->chan);
830
831 kfree(dtc);
832}
833
834static int dmatest_add_threads(struct dmatest_info *info,
835 struct dmatest_chan *dtc, enum dma_transaction_type type)
836{
837 struct dmatest_params *params = &info->params;
838 struct dmatest_thread *thread;
839 struct dma_chan *chan = dtc->chan;
840 char *op;
841 unsigned int i;
842
843 if (type == DMA_MEMCPY)
844 op = "copy";
845 else if (type == DMA_MEMSET)
846 op = "set";
847 else if (type == DMA_XOR)
848 op = "xor";
849 else if (type == DMA_PQ)
850 op = "pq";
851 else
852 return -EINVAL;
853
854 for (i = 0; i < params->threads_per_chan; i++) {
855 thread = kzalloc(sizeof(struct dmatest_thread), GFP_KERNEL);
856 if (!thread) {
857 pr_warn("No memory for %s-%s%u\n",
858 dma_chan_name(chan), op, i);
859 break;
860 }
861 thread->info = info;
862 thread->chan = dtc->chan;
863 thread->type = type;
864 thread->test_done.wait = &thread->done_wait;
865 init_waitqueue_head(&thread->done_wait);
866 smp_wmb();
867 thread->task = kthread_create(dmatest_func, thread, "%s-%s%u",
868 dma_chan_name(chan), op, i);
869 if (IS_ERR(thread->task)) {
870 pr_warn("Failed to create thread %s-%s%u\n",
871 dma_chan_name(chan), op, i);
872 kfree(thread);
873 break;
874 }
875
876 /* srcbuf and dstbuf are allocated by the thread itself */
877 get_task_struct(thread->task);
878 list_add_tail(&thread->node, &dtc->threads);
879 wake_up_process(thread->task);
880 }
881
882 return i;
883}
884
885static int dmatest_add_channel(struct dmatest_info *info,
886 struct dma_chan *chan)
887{
888 struct dmatest_chan *dtc;
889 struct dma_device *dma_dev = chan->device;
890 unsigned int thread_count = 0;
891 int cnt;
892
893 dtc = kmalloc(sizeof(struct dmatest_chan), GFP_KERNEL);
894 if (!dtc) {
895 pr_warn("No memory for %s\n", dma_chan_name(chan));
896 return -ENOMEM;
897 }
898
899 dtc->chan = chan;
900 INIT_LIST_HEAD(&dtc->threads);
901
902 if (dma_has_cap(DMA_MEMCPY, dma_dev->cap_mask)) {
903 if (dmatest == 0) {
904 cnt = dmatest_add_threads(info, dtc, DMA_MEMCPY);
905 thread_count += cnt > 0 ? cnt : 0;
906 }
907 }
908
909 if (dma_has_cap(DMA_MEMSET, dma_dev->cap_mask)) {
910 if (dmatest == 1) {
911 cnt = dmatest_add_threads(info, dtc, DMA_MEMSET);
912 thread_count += cnt > 0 ? cnt : 0;
913 }
914 }
915
916 if (dma_has_cap(DMA_XOR, dma_dev->cap_mask)) {
917 cnt = dmatest_add_threads(info, dtc, DMA_XOR);
918 thread_count += cnt > 0 ? cnt : 0;
919 }
920 if (dma_has_cap(DMA_PQ, dma_dev->cap_mask)) {
921 cnt = dmatest_add_threads(info, dtc, DMA_PQ);
922 thread_count += cnt > 0 ? cnt : 0;
923 }
924
925 pr_info("Started %u threads using %s\n",
926 thread_count, dma_chan_name(chan));
927
928 list_add_tail(&dtc->node, &info->channels);
929 info->nr_channels++;
930
931 return 0;
932}
933
934static bool filter(struct dma_chan *chan, void *param)
935{
936 struct dmatest_params *params = param;
937
938 if (!dmatest_match_channel(params, chan) ||
939 !dmatest_match_device(params, chan->device))
940 return false;
941 else
942 return true;
943}
944
945static void request_channels(struct dmatest_info *info,
946 enum dma_transaction_type type)
947{
948 dma_cap_mask_t mask;
949
950 dma_cap_zero(mask);
951 dma_cap_set(type, mask);
952 for (;;) {
953 struct dmatest_params *params = &info->params;
954 struct dma_chan *chan;
955
956 chan = dma_request_channel(mask, filter, params);
957 if (chan) {
958 if (dmatest_add_channel(info, chan)) {
959 dma_release_channel(chan);
960 break; /* add_channel failed, punt */
961 }
962 } else
963 break; /* no more channels available */
964 if (params->max_channels &&
965 info->nr_channels >= params->max_channels)
966 break; /* we have all we need */
967 }
968}
969
970static void run_threaded_test(struct dmatest_info *info)
971{
972 struct dmatest_params *params = &info->params;
973
974 /* Copy test parameters */
975 params->buf_size = test_buf_size;
976 strlcpy(params->channel, strim(test_channel), sizeof(params->channel));
977 strlcpy(params->device, strim(test_device), sizeof(params->device));
978 params->threads_per_chan = threads_per_chan;
979 params->max_channels = max_channels;
980 params->iterations = iterations;
981 params->xor_sources = xor_sources;
982 params->pq_sources = pq_sources;
983 params->timeout = timeout;
984 params->noverify = noverify;
985 params->norandom = norandom;
986
987 request_channels(info, DMA_MEMCPY);
988 request_channels(info, DMA_MEMSET);
989 request_channels(info, DMA_XOR);
990 request_channels(info, DMA_PQ);
991}
992
993static void stop_threaded_test(struct dmatest_info *info)
994{
995 struct dmatest_chan *dtc, *_dtc;
996 struct dma_chan *chan;
997
998 list_for_each_entry_safe(dtc, _dtc, &info->channels, node) {
999 list_del(&dtc->node);
1000 chan = dtc->chan;
1001 dmatest_cleanup_channel(dtc);
1002 pr_debug("dropped channel %s\n", dma_chan_name(chan));
1003 dma_release_channel(chan);
1004 }
1005
1006 info->nr_channels = 0;
1007}
1008
1009static void restart_threaded_test(struct dmatest_info *info, bool run)
1010{
1011 /* we might be called early to set run=, defer running until all
1012 * parameters have been evaluated
1013 */
1014 if (!info->did_init)
1015 return;
1016
1017 /* Stop any running test first */
1018 stop_threaded_test(info);
1019
1020 /* Run test with new parameters */
1021 run_threaded_test(info);
1022}
1023
1024static int dmatest_run_get(char *val, const struct kernel_param *kp)
1025{
1026 struct dmatest_info *info = &test_info;
1027
1028 mutex_lock(&info->lock);
1029 if (is_threaded_test_run(info)) {
1030 dmatest_run = true;
1031 } else {
1032 stop_threaded_test(info);
1033 dmatest_run = false;
1034 }
1035 mutex_unlock(&info->lock);
1036
1037 return param_get_bool(val, kp);
1038}
1039
1040static int dmatest_run_set(const char *val, const struct kernel_param *kp)
1041{
1042 struct dmatest_info *info = &test_info;
1043 int ret;
1044
1045 mutex_lock(&info->lock);
1046 ret = param_set_bool(val, kp);
1047 if (ret) {
1048 mutex_unlock(&info->lock);
1049 return ret;
1050 }
1051
1052 if (is_threaded_test_run(info))
1053 ret = -EBUSY;
1054 else if (dmatest_run)
1055 restart_threaded_test(info, dmatest_run);
1056
1057 mutex_unlock(&info->lock);
1058
1059 return ret;
1060}
1061
1062static int __init dmatest_init(void)
1063{
1064 struct dmatest_info *info = &test_info;
1065 struct dmatest_params *params = &info->params;
1066
1067 if (dmatest_run) {
1068 mutex_lock(&info->lock);
1069 run_threaded_test(info);
1070 mutex_unlock(&info->lock);
1071 }
1072
1073 if (params->iterations && wait)
1074 wait_event(thread_wait, !is_threaded_test_run(info));
1075
1076 /* module parameters are stable, inittime tests are started,
1077 * let userspace take over 'run' control
1078 */
1079 info->did_init = true;
1080
1081 return 0;
1082}
1083/* when compiled-in wait for drivers to load first */
1084late_initcall(dmatest_init);
1085
1086static void __exit dmatest_exit(void)
1087{
1088 struct dmatest_info *info = &test_info;
1089
1090 mutex_lock(&info->lock);
1091 stop_threaded_test(info);
1092 mutex_unlock(&info->lock);
1093}
1094module_exit(dmatest_exit);
1095
1096MODULE_AUTHOR("Haavard Skinnemoen (Atmel)");
1097MODULE_LICENSE("GPL v2");