mirror of
				git://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git
				synced 2025-09-04 20:19:47 +08:00 
			
		
		
		
	 647c734f62
			
		
	
	
		647c734f62
		
	
	
	
	
		
			
			Add a compression testcase for the powerpc NX-GZIP engine. Signed-off-by: Bulent Abali <abali@us.ibm.com> Signed-off-by: Raphael Moreira Zinsly <rzinsly@linux.ibm.com> Signed-off-by: Michael Ellerman <mpe@ellerman.id.au> Link: https://lore.kernel.org/r/20200420205538.25181-4-rzinsly@linux.ibm.com
		
			
				
	
	
		
			317 lines
		
	
	
		
			6.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			317 lines
		
	
	
		
			6.3 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| // SPDX-License-Identifier: GPL-2.0-or-later
 | |
| 
 | |
| /*
 | |
|  * Copyright 2020 IBM Corp.
 | |
|  *
 | |
|  * Author: Bulent Abali <abali@us.ibm.com>
 | |
|  *
 | |
|  */
 | |
| #include <stdio.h>
 | |
| #include <stdlib.h>
 | |
| #include <string.h>
 | |
| #include <unistd.h>
 | |
| #include <stdint.h>
 | |
| #include <sys/types.h>
 | |
| #include <sys/stat.h>
 | |
| #include <sys/time.h>
 | |
| #include <sys/fcntl.h>
 | |
| #include <sys/mman.h>
 | |
| #include <endian.h>
 | |
| #include <bits/endian.h>
 | |
| #include <sys/ioctl.h>
 | |
| #include <assert.h>
 | |
| #include <errno.h>
 | |
| #include <signal.h>
 | |
| #include "vas-api.h"
 | |
| #include "nx.h"
 | |
| #include "copy-paste.h"
 | |
| #include "nxu.h"
 | |
| #include "nx_dbg.h"
 | |
| #include <sys/platform/ppc.h>
 | |
| 
 | |
/* barrier() expands to nothing in this file. */
#define barrier()

/* Issue the PowerPC "sync" instruction; the "memory" clobber also stops
 * the compiler from caching memory values across it.
 */
#define hwsync()    ({ __asm__ __volatile__("sync" : : : "memory"); })

/*
 * Hint instructions emitted around the CSB polling loop.  Going by the
 * macro names and the comment in nx_wait_for_csb(), "or 31, 31, 31"
 * lowers the priority of this hardware thread and "or 2, 2, 2" restores
 * the default.  Building with NX_NO_CPU_PRI turns both into no-ops.
 */
#ifdef NX_NO_CPU_PRI
#define cpu_pri_default()
#define cpu_pri_low()
#else
#define cpu_pri_default()  ({ __asm__ __volatile__("or 2, 2, 2"); })
#define cpu_pri_low()      ({ __asm__ __volatile__("or 31, 31, 31"); })
#endif

/*
 * Address reported by the last signal seen by nxu_sigsegv_handler().
 * nx_wait_for_csb() polls it, and nxu_run_job() touches the address and
 * then resets it to zero before retrying.
 */
void *nx_fault_storage_address;

/* Per-session state handed out by nx_function_begin(). */
struct nx_handle {
	int fd;			/* descriptor of the opened device node */
	int function;		/* function code passed to nx_function_begin() */
	void *paste_addr;	/* device mapping base + 0x400 */
};
 | |
| 
 | |
| static int open_device_nodes(char *devname, int pri, struct nx_handle *handle)
 | |
| {
 | |
| 	int rc, fd;
 | |
| 	void *addr;
 | |
| 	struct vas_tx_win_open_attr txattr;
 | |
| 
 | |
| 	fd = open(devname, O_RDWR);
 | |
| 	if (fd < 0) {
 | |
| 		fprintf(stderr, " open device name %s\n", devname);
 | |
| 		return -errno;
 | |
| 	}
 | |
| 
 | |
| 	memset(&txattr, 0, sizeof(txattr));
 | |
| 	txattr.version = 1;
 | |
| 	txattr.vas_id = pri;
 | |
| 	rc = ioctl(fd, VAS_TX_WIN_OPEN, (unsigned long)&txattr);
 | |
| 	if (rc < 0) {
 | |
| 		fprintf(stderr, "ioctl() n %d, error %d\n", rc, errno);
 | |
| 		rc = -errno;
 | |
| 		goto out;
 | |
| 	}
 | |
| 
 | |
| 	addr = mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0ULL);
 | |
| 	if (addr == MAP_FAILED) {
 | |
| 		fprintf(stderr, "mmap() failed, errno %d\n", errno);
 | |
| 		rc = -errno;
 | |
| 		goto out;
 | |
| 	}
 | |
| 	handle->fd = fd;
 | |
| 	handle->paste_addr = (void *)((char *)addr + 0x400);
 | |
| 
 | |
| 	rc = 0;
 | |
| out:
 | |
| 	close(fd);
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| void *nx_function_begin(int function, int pri)
 | |
| {
 | |
| 	int rc;
 | |
| 	char *devname = "/dev/crypto/nx-gzip";
 | |
| 	struct nx_handle *nxhandle;
 | |
| 
 | |
| 	if (function != NX_FUNC_COMP_GZIP) {
 | |
| 		errno = EINVAL;
 | |
| 		fprintf(stderr, " NX_FUNC_COMP_GZIP not found\n");
 | |
| 		return NULL;
 | |
| 	}
 | |
| 
 | |
| 
 | |
| 	nxhandle = malloc(sizeof(*nxhandle));
 | |
| 	if (!nxhandle) {
 | |
| 		errno = ENOMEM;
 | |
| 		fprintf(stderr, " No memory\n");
 | |
| 		return NULL;
 | |
| 	}
 | |
| 
 | |
| 	nxhandle->function = function;
 | |
| 	rc = open_device_nodes(devname, pri, nxhandle);
 | |
| 	if (rc < 0) {
 | |
| 		errno = -rc;
 | |
| 		fprintf(stderr, " open_device_nodes failed\n");
 | |
| 		return NULL;
 | |
| 	}
 | |
| 
 | |
| 	return nxhandle;
 | |
| }
 | |
| 
 | |
| int nx_function_end(void *handle)
 | |
| {
 | |
| 	int rc = 0;
 | |
| 	struct nx_handle *nxhandle = handle;
 | |
| 
 | |
| 	rc = munmap(nxhandle->paste_addr - 0x400, 4096);
 | |
| 	if (rc < 0) {
 | |
| 		fprintf(stderr, "munmap() failed, errno %d\n", errno);
 | |
| 		return rc;
 | |
| 	}
 | |
| 	close(nxhandle->fd);
 | |
| 	free(nxhandle);
 | |
| 
 | |
| 	return rc;
 | |
| }
 | |
| 
 | |
| static int nx_wait_for_csb(struct nx_gzip_crb_cpb_t *cmdp)
 | |
| {
 | |
| 	long poll = 0;
 | |
| 	uint64_t t;
 | |
| 
 | |
| 	/* Save power and let other threads use the h/w. top may show
 | |
| 	 * 100% but only because OS doesn't know we slowed the this
 | |
| 	 * h/w thread while polling. We're letting other threads have
 | |
| 	 * higher throughput on the core.
 | |
| 	 */
 | |
| 	cpu_pri_low();
 | |
| 
 | |
| #define CSB_MAX_POLL 200000000UL
 | |
| #define USLEEP_TH     300000UL
 | |
| 
 | |
| 	t = __ppc_get_timebase();
 | |
| 
 | |
| 	while (getnn(cmdp->crb.csb, csb_v) == 0) {
 | |
| 		++poll;
 | |
| 		hwsync();
 | |
| 
 | |
| 		cpu_pri_low();
 | |
| 
 | |
| 		/* usleep(0) takes around 29000 ticks ~60 us.
 | |
| 		 * 300000 is spinning for about 600 us then
 | |
| 		 * start sleeping.
 | |
| 		 */
 | |
| 		if ((__ppc_get_timebase() - t) > USLEEP_TH) {
 | |
| 			cpu_pri_default();
 | |
| 			usleep(1);
 | |
| 		}
 | |
| 
 | |
| 		if (poll > CSB_MAX_POLL)
 | |
| 			break;
 | |
| 
 | |
| 		/* Fault address from signal handler */
 | |
| 		if (nx_fault_storage_address) {
 | |
| 			cpu_pri_default();
 | |
| 			return -EAGAIN;
 | |
| 		}
 | |
| 
 | |
| 	}
 | |
| 
 | |
| 	cpu_pri_default();
 | |
| 
 | |
| 	/* hw has updated csb and output buffer */
 | |
| 	hwsync();
 | |
| 
 | |
| 	/* Check CSB flags. */
 | |
| 	if (getnn(cmdp->crb.csb, csb_v) == 0) {
 | |
| 		fprintf(stderr, "CSB still not valid after %d polls.\n",
 | |
| 			(int) poll);
 | |
| 		prt_err("CSB still not valid after %d polls, giving up.\n",
 | |
| 			(int) poll);
 | |
| 		return -ETIMEDOUT;
 | |
| 	}
 | |
| 
 | |
| 	return 0;
 | |
| }
 | |
| 
 | |
| static int nxu_run_job(struct nx_gzip_crb_cpb_t *cmdp, void *handle)
 | |
| {
 | |
| 	int i, ret, retries;
 | |
| 	struct nx_handle *nxhandle = handle;
 | |
| 
 | |
| 	assert(handle != NULL);
 | |
| 	i = 0;
 | |
| 	retries = 5000;
 | |
| 	while (i++ < retries) {
 | |
| 		hwsync();
 | |
| 		vas_copy(&cmdp->crb, 0);
 | |
| 		ret = vas_paste(nxhandle->paste_addr, 0);
 | |
| 		hwsync();
 | |
| 
 | |
| 		NXPRT(fprintf(stderr, "Paste attempt %d/%d returns 0x%x\n",
 | |
| 				i, retries, ret));
 | |
| 
 | |
| 		if ((ret == 2) || (ret == 3)) {
 | |
| 
 | |
| 			ret = nx_wait_for_csb(cmdp);
 | |
| 			if (!ret) {
 | |
| 				goto out;
 | |
| 			} else if (ret == -EAGAIN) {
 | |
| 				long x;
 | |
| 
 | |
| 				prt_err("Touching address %p, 0x%lx\n",
 | |
| 					 nx_fault_storage_address,
 | |
| 					 *(long *) nx_fault_storage_address);
 | |
| 				x = *(long *) nx_fault_storage_address;
 | |
| 				*(long *) nx_fault_storage_address = x;
 | |
| 				nx_fault_storage_address = 0;
 | |
| 				continue;
 | |
| 			} else {
 | |
| 				prt_err("wait_for_csb() returns %d\n", ret);
 | |
| 				break;
 | |
| 			}
 | |
| 		} else {
 | |
| 			if (i < 10) {
 | |
| 				/* spin for few ticks */
 | |
| #define SPIN_TH 500UL
 | |
| 				uint64_t fail_spin;
 | |
| 
 | |
| 				fail_spin = __ppc_get_timebase();
 | |
| 				while ((__ppc_get_timebase() - fail_spin) <
 | |
| 					 SPIN_TH)
 | |
| 					;
 | |
| 			} else {
 | |
| 				/* sleep */
 | |
| 				unsigned int pr = 0;
 | |
| 
 | |
| 				if (pr++ % 100 == 0) {
 | |
| 					prt_err("Paste attempt %d/", i);
 | |
| 					prt_err("%d, failed pid= %d\n", retries,
 | |
| 						getpid());
 | |
| 				}
 | |
| 				usleep(1);
 | |
| 			}
 | |
| 			continue;
 | |
| 		}
 | |
| 	}
 | |
| 
 | |
| out:
 | |
| 	cpu_pri_default();
 | |
| 
 | |
| 	return ret;
 | |
| }
 | |
| 
 | |
| int nxu_submit_job(struct nx_gzip_crb_cpb_t *cmdp, void *handle)
 | |
| {
 | |
| 	int cc;
 | |
| 
 | |
| 	cc = nxu_run_job(cmdp, handle);
 | |
| 
 | |
| 	if (!cc)
 | |
| 		cc = getnn(cmdp->crb.csb, csb_cc);      /* CC Table 6-8 */
 | |
| 
 | |
| 	return cc;
 | |
| }
 | |
| 
 | |
| 
 | |
| void nxu_sigsegv_handler(int sig, siginfo_t *info, void *ctx)
 | |
| {
 | |
| 	fprintf(stderr, "%d: Got signal %d si_code %d, si_addr %p\n", getpid(),
 | |
| 		sig, info->si_code, info->si_addr);
 | |
| 
 | |
| 	nx_fault_storage_address = info->si_addr;
 | |
| }
 | |
| 
 | |
/*
 * Fault in pages prior to NX job submission by touching one byte every
 * @page_len bytes of the buffer, plus its last byte.
 *
 * @buf:      start of the buffer.
 * @buf_len:  length of the buffer in bytes.
 * @page_len: stride between touched bytes, in bytes; must be positive.
 * @wr:       when non-zero each touched byte is also written back.
 *            wr=1 may be required to touch writeable pages, because
 *            system zero pages do not fault-in the page as intended.
 *            Typically set wr=1 for NX target pages and wr=0 for NX
 *            source pages.
 *
 * Returns 0 on success, or -1 if @buf is NULL, @buf_len is not positive
 * or @page_len is not positive.  A non-positive @page_len used to loop
 * forever or walk backwards out of the buffer.
 */
int nxu_touch_pages(void *buf, long buf_len, long page_len, int wr)
{
	char *base = buf;
	long last, off;
	volatile char t;

	assert(buf_len >= 0 && !!buf);

	NXPRT(fprintf(stderr, "touch %p %p len 0x%lx wr=%d\n", buf,
			(void *)(base + buf_len), buf_len, wr));

	if (buf_len <= 0 || buf == NULL || page_len <= 0)
		return -1;

	last = buf_len - 1;

	/* Walk by offset rather than by pointer so nothing is ever formed
	 * beyond the buffer; the stride stops once the next step would
	 * reach or pass the last byte.
	 */
	off = 0;
	for (;;) {
		t = base[off];
		if (wr)
			base[off] = t;
		if (page_len >= last - off)
			break;
		off += page_len;
	}

	/* When buf_len is small or the buffer tail is in another page */
	t = base[last];
	if (wr)
		base[last] = t;

	return 0;
}
 |