162306a36Sopenharmony_ci// SPDX-License-Identifier: GPL-2.0-only
262306a36Sopenharmony_ci/*
362306a36Sopenharmony_ci * Copyright (C) 2020 HiSilicon Limited.
462306a36Sopenharmony_ci */
562306a36Sopenharmony_ci
#include <errno.h>
#include <fcntl.h>
#include <limits.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <unistd.h>
#include <sys/ioctl.h>
#include <sys/mman.h>
#include <linux/types.h>
#include <linux/map_benchmark.h>
1562306a36Sopenharmony_ci
/*
 * Nanoseconds per millisecond, as a long constant.
 * Guarded so that a header which already provides the macro does not
 * trigger a redefinition diagnostic.
 */
#ifndef NSEC_PER_MSEC
#define NSEC_PER_MSEC	1000000L
#endif
1762306a36Sopenharmony_ci
/*
 * Human-readable names of the DMA directions, indexed by the direction
 * value selected with -d. The table is read-only, so both the pointers
 * and the strings they refer to are const.
 */
static const char *const directions[] = {
	"BIDIRECTIONAL",
	"TO_DEVICE",
	"FROM_DEVICE",
};
2362306a36Sopenharmony_ci
2462306a36Sopenharmony_ciint main(int argc, char **argv)
2562306a36Sopenharmony_ci{
2662306a36Sopenharmony_ci	struct map_benchmark map;
2762306a36Sopenharmony_ci	int fd, opt;
2862306a36Sopenharmony_ci	/* default single thread, run 20 seconds on NUMA_NO_NODE */
2962306a36Sopenharmony_ci	int threads = 1, seconds = 20, node = -1;
3062306a36Sopenharmony_ci	/* default dma mask 32bit, bidirectional DMA */
3162306a36Sopenharmony_ci	int bits = 32, xdelay = 0, dir = DMA_MAP_BIDIRECTIONAL;
3262306a36Sopenharmony_ci	/* default granule 1 PAGESIZE */
3362306a36Sopenharmony_ci	int granule = 1;
3462306a36Sopenharmony_ci
3562306a36Sopenharmony_ci	int cmd = DMA_MAP_BENCHMARK;
3662306a36Sopenharmony_ci	char *p;
3762306a36Sopenharmony_ci
3862306a36Sopenharmony_ci	while ((opt = getopt(argc, argv, "t:s:n:b:d:x:g:")) != -1) {
3962306a36Sopenharmony_ci		switch (opt) {
4062306a36Sopenharmony_ci		case 't':
4162306a36Sopenharmony_ci			threads = atoi(optarg);
4262306a36Sopenharmony_ci			break;
4362306a36Sopenharmony_ci		case 's':
4462306a36Sopenharmony_ci			seconds = atoi(optarg);
4562306a36Sopenharmony_ci			break;
4662306a36Sopenharmony_ci		case 'n':
4762306a36Sopenharmony_ci			node = atoi(optarg);
4862306a36Sopenharmony_ci			break;
4962306a36Sopenharmony_ci		case 'b':
5062306a36Sopenharmony_ci			bits = atoi(optarg);
5162306a36Sopenharmony_ci			break;
5262306a36Sopenharmony_ci		case 'd':
5362306a36Sopenharmony_ci			dir = atoi(optarg);
5462306a36Sopenharmony_ci			break;
5562306a36Sopenharmony_ci		case 'x':
5662306a36Sopenharmony_ci			xdelay = atoi(optarg);
5762306a36Sopenharmony_ci			break;
5862306a36Sopenharmony_ci		case 'g':
5962306a36Sopenharmony_ci			granule = atoi(optarg);
6062306a36Sopenharmony_ci			break;
6162306a36Sopenharmony_ci		default:
6262306a36Sopenharmony_ci			return -1;
6362306a36Sopenharmony_ci		}
6462306a36Sopenharmony_ci	}
6562306a36Sopenharmony_ci
6662306a36Sopenharmony_ci	if (threads <= 0 || threads > DMA_MAP_MAX_THREADS) {
6762306a36Sopenharmony_ci		fprintf(stderr, "invalid number of threads, must be in 1-%d\n",
6862306a36Sopenharmony_ci			DMA_MAP_MAX_THREADS);
6962306a36Sopenharmony_ci		exit(1);
7062306a36Sopenharmony_ci	}
7162306a36Sopenharmony_ci
7262306a36Sopenharmony_ci	if (seconds <= 0 || seconds > DMA_MAP_MAX_SECONDS) {
7362306a36Sopenharmony_ci		fprintf(stderr, "invalid number of seconds, must be in 1-%d\n",
7462306a36Sopenharmony_ci			DMA_MAP_MAX_SECONDS);
7562306a36Sopenharmony_ci		exit(1);
7662306a36Sopenharmony_ci	}
7762306a36Sopenharmony_ci
7862306a36Sopenharmony_ci	if (xdelay < 0 || xdelay > DMA_MAP_MAX_TRANS_DELAY) {
7962306a36Sopenharmony_ci		fprintf(stderr, "invalid transmit delay, must be in 0-%ld\n",
8062306a36Sopenharmony_ci			DMA_MAP_MAX_TRANS_DELAY);
8162306a36Sopenharmony_ci		exit(1);
8262306a36Sopenharmony_ci	}
8362306a36Sopenharmony_ci
8462306a36Sopenharmony_ci	/* suppose the mininum DMA zone is 1MB in the world */
8562306a36Sopenharmony_ci	if (bits < 20 || bits > 64) {
8662306a36Sopenharmony_ci		fprintf(stderr, "invalid dma mask bit, must be in 20-64\n");
8762306a36Sopenharmony_ci		exit(1);
8862306a36Sopenharmony_ci	}
8962306a36Sopenharmony_ci
9062306a36Sopenharmony_ci	if (dir != DMA_MAP_BIDIRECTIONAL && dir != DMA_MAP_TO_DEVICE &&
9162306a36Sopenharmony_ci			dir != DMA_MAP_FROM_DEVICE) {
9262306a36Sopenharmony_ci		fprintf(stderr, "invalid dma direction\n");
9362306a36Sopenharmony_ci		exit(1);
9462306a36Sopenharmony_ci	}
9562306a36Sopenharmony_ci
9662306a36Sopenharmony_ci	if (granule < 1 || granule > 1024) {
9762306a36Sopenharmony_ci		fprintf(stderr, "invalid granule size\n");
9862306a36Sopenharmony_ci		exit(1);
9962306a36Sopenharmony_ci	}
10062306a36Sopenharmony_ci
10162306a36Sopenharmony_ci	fd = open("/sys/kernel/debug/dma_map_benchmark", O_RDWR);
10262306a36Sopenharmony_ci	if (fd == -1) {
10362306a36Sopenharmony_ci		perror("open");
10462306a36Sopenharmony_ci		exit(1);
10562306a36Sopenharmony_ci	}
10662306a36Sopenharmony_ci
10762306a36Sopenharmony_ci	memset(&map, 0, sizeof(map));
10862306a36Sopenharmony_ci	map.seconds = seconds;
10962306a36Sopenharmony_ci	map.threads = threads;
11062306a36Sopenharmony_ci	map.node = node;
11162306a36Sopenharmony_ci	map.dma_bits = bits;
11262306a36Sopenharmony_ci	map.dma_dir = dir;
11362306a36Sopenharmony_ci	map.dma_trans_ns = xdelay;
11462306a36Sopenharmony_ci	map.granule = granule;
11562306a36Sopenharmony_ci
11662306a36Sopenharmony_ci	if (ioctl(fd, cmd, &map)) {
11762306a36Sopenharmony_ci		perror("ioctl");
11862306a36Sopenharmony_ci		exit(1);
11962306a36Sopenharmony_ci	}
12062306a36Sopenharmony_ci
12162306a36Sopenharmony_ci	printf("dma mapping benchmark: threads:%d seconds:%d node:%d dir:%s granule: %d\n",
12262306a36Sopenharmony_ci			threads, seconds, node, dir[directions], granule);
12362306a36Sopenharmony_ci	printf("average map latency(us):%.1f standard deviation:%.1f\n",
12462306a36Sopenharmony_ci			map.avg_map_100ns/10.0, map.map_stddev/10.0);
12562306a36Sopenharmony_ci	printf("average unmap latency(us):%.1f standard deviation:%.1f\n",
12662306a36Sopenharmony_ci			map.avg_unmap_100ns/10.0, map.unmap_stddev/10.0);
12762306a36Sopenharmony_ci
12862306a36Sopenharmony_ci	return 0;
12962306a36Sopenharmony_ci}
130