317 lines
6.3 KiB
C
317 lines
6.3 KiB
C
|
// SPDX-License-Identifier: GPL-2.0-or-later
|
||
|
|
||
|
/*
|
||
|
* Copyright 2020 IBM Corp.
|
||
|
*
|
||
|
* Author: Bulent Abali <abali@us.ibm.com>
|
||
|
*
|
||
|
*/
|
||
|
#include <stdio.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <string.h>
|
||
|
#include <unistd.h>
|
||
|
#include <stdint.h>
|
||
|
#include <sys/types.h>
|
||
|
#include <sys/stat.h>
|
||
|
#include <sys/time.h>
|
||
|
#include <sys/fcntl.h>
|
||
|
#include <sys/mman.h>
|
||
|
#include <endian.h>
|
||
|
#include <bits/endian.h>
|
||
|
#include <sys/ioctl.h>
|
||
|
#include <assert.h>
|
||
|
#include <errno.h>
|
||
|
#include <signal.h>
|
||
|
#include "vas-api.h"
|
||
|
#include "nx.h"
|
||
|
#include "copy-paste.h"
|
||
|
#include "nxu.h"
|
||
|
#include "nx_dbg.h"
|
||
|
#include <sys/platform/ppc.h>
|
||
|
|
||
|
#define barrier()
|
||
|
#define hwsync() ({ asm volatile("sync" ::: "memory"); })
|
||
|
|
||
|
#ifndef NX_NO_CPU_PRI
|
||
|
#define cpu_pri_default() ({ asm volatile ("or 2, 2, 2"); })
|
||
|
#define cpu_pri_low() ({ asm volatile ("or 31, 31, 31"); })
|
||
|
#else
|
||
|
#define cpu_pri_default()
|
||
|
#define cpu_pri_low()
|
||
|
#endif
|
||
|
|
||
|
void *nx_fault_storage_address;
|
||
|
|
||
|
struct nx_handle {
|
||
|
int fd;
|
||
|
int function;
|
||
|
void *paste_addr;
|
||
|
};
|
||
|
|
||
|
static int open_device_nodes(char *devname, int pri, struct nx_handle *handle)
|
||
|
{
|
||
|
int rc, fd;
|
||
|
void *addr;
|
||
|
struct vas_tx_win_open_attr txattr;
|
||
|
|
||
|
fd = open(devname, O_RDWR);
|
||
|
if (fd < 0) {
|
||
|
fprintf(stderr, " open device name %s\n", devname);
|
||
|
return -errno;
|
||
|
}
|
||
|
|
||
|
memset(&txattr, 0, sizeof(txattr));
|
||
|
txattr.version = 1;
|
||
|
txattr.vas_id = pri;
|
||
|
rc = ioctl(fd, VAS_TX_WIN_OPEN, (unsigned long)&txattr);
|
||
|
if (rc < 0) {
|
||
|
fprintf(stderr, "ioctl() n %d, error %d\n", rc, errno);
|
||
|
rc = -errno;
|
||
|
goto out;
|
||
|
}
|
||
|
|
||
|
addr = mmap(NULL, 4096, PROT_READ|PROT_WRITE, MAP_SHARED, fd, 0ULL);
|
||
|
if (addr == MAP_FAILED) {
|
||
|
fprintf(stderr, "mmap() failed, errno %d\n", errno);
|
||
|
rc = -errno;
|
||
|
goto out;
|
||
|
}
|
||
|
handle->fd = fd;
|
||
|
handle->paste_addr = (void *)((char *)addr + 0x400);
|
||
|
|
||
|
rc = 0;
|
||
|
out:
|
||
|
close(fd);
|
||
|
return rc;
|
||
|
}
|
||
|
|
||
|
void *nx_function_begin(int function, int pri)
|
||
|
{
|
||
|
int rc;
|
||
|
char *devname = "/dev/crypto/nx-gzip";
|
||
|
struct nx_handle *nxhandle;
|
||
|
|
||
|
if (function != NX_FUNC_COMP_GZIP) {
|
||
|
errno = EINVAL;
|
||
|
fprintf(stderr, " NX_FUNC_COMP_GZIP not found\n");
|
||
|
return NULL;
|
||
|
}
|
||
|
|
||
|
|
||
|
nxhandle = malloc(sizeof(*nxhandle));
|
||
|
if (!nxhandle) {
|
||
|
errno = ENOMEM;
|
||
|
fprintf(stderr, " No memory\n");
|
||
|
return NULL;
|
||
|
}
|
||
|
|
||
|
nxhandle->function = function;
|
||
|
rc = open_device_nodes(devname, pri, nxhandle);
|
||
|
if (rc < 0) {
|
||
|
errno = -rc;
|
||
|
fprintf(stderr, " open_device_nodes failed\n");
|
||
|
return NULL;
|
||
|
}
|
||
|
|
||
|
return nxhandle;
|
||
|
}
|
||
|
|
||
|
int nx_function_end(void *handle)
|
||
|
{
|
||
|
int rc = 0;
|
||
|
struct nx_handle *nxhandle = handle;
|
||
|
|
||
|
rc = munmap(nxhandle->paste_addr - 0x400, 4096);
|
||
|
if (rc < 0) {
|
||
|
fprintf(stderr, "munmap() failed, errno %d\n", errno);
|
||
|
return rc;
|
||
|
}
|
||
|
close(nxhandle->fd);
|
||
|
free(nxhandle);
|
||
|
|
||
|
return rc;
|
||
|
}
|
||
|
|
||
|
static int nx_wait_for_csb(struct nx_gzip_crb_cpb_t *cmdp)
|
||
|
{
|
||
|
long poll = 0;
|
||
|
uint64_t t;
|
||
|
|
||
|
/* Save power and let other threads use the h/w. top may show
|
||
|
* 100% but only because OS doesn't know we slowed the this
|
||
|
* h/w thread while polling. We're letting other threads have
|
||
|
* higher throughput on the core.
|
||
|
*/
|
||
|
cpu_pri_low();
|
||
|
|
||
|
#define CSB_MAX_POLL 200000000UL
|
||
|
#define USLEEP_TH 300000UL
|
||
|
|
||
|
t = __ppc_get_timebase();
|
||
|
|
||
|
while (getnn(cmdp->crb.csb, csb_v) == 0) {
|
||
|
++poll;
|
||
|
hwsync();
|
||
|
|
||
|
cpu_pri_low();
|
||
|
|
||
|
/* usleep(0) takes around 29000 ticks ~60 us.
|
||
|
* 300000 is spinning for about 600 us then
|
||
|
* start sleeping.
|
||
|
*/
|
||
|
if ((__ppc_get_timebase() - t) > USLEEP_TH) {
|
||
|
cpu_pri_default();
|
||
|
usleep(1);
|
||
|
}
|
||
|
|
||
|
if (poll > CSB_MAX_POLL)
|
||
|
break;
|
||
|
|
||
|
/* Fault address from signal handler */
|
||
|
if (nx_fault_storage_address) {
|
||
|
cpu_pri_default();
|
||
|
return -EAGAIN;
|
||
|
}
|
||
|
|
||
|
}
|
||
|
|
||
|
cpu_pri_default();
|
||
|
|
||
|
/* hw has updated csb and output buffer */
|
||
|
hwsync();
|
||
|
|
||
|
/* Check CSB flags. */
|
||
|
if (getnn(cmdp->crb.csb, csb_v) == 0) {
|
||
|
fprintf(stderr, "CSB still not valid after %d polls.\n",
|
||
|
(int) poll);
|
||
|
prt_err("CSB still not valid after %d polls, giving up.\n",
|
||
|
(int) poll);
|
||
|
return -ETIMEDOUT;
|
||
|
}
|
||
|
|
||
|
return 0;
|
||
|
}
|
||
|
|
||
|
static int nxu_run_job(struct nx_gzip_crb_cpb_t *cmdp, void *handle)
|
||
|
{
|
||
|
int i, ret, retries;
|
||
|
struct nx_handle *nxhandle = handle;
|
||
|
|
||
|
assert(handle != NULL);
|
||
|
i = 0;
|
||
|
retries = 5000;
|
||
|
while (i++ < retries) {
|
||
|
hwsync();
|
||
|
vas_copy(&cmdp->crb, 0);
|
||
|
ret = vas_paste(nxhandle->paste_addr, 0);
|
||
|
hwsync();
|
||
|
|
||
|
NXPRT(fprintf(stderr, "Paste attempt %d/%d returns 0x%x\n",
|
||
|
i, retries, ret));
|
||
|
|
||
|
if ((ret == 2) || (ret == 3)) {
|
||
|
|
||
|
ret = nx_wait_for_csb(cmdp);
|
||
|
if (!ret) {
|
||
|
goto out;
|
||
|
} else if (ret == -EAGAIN) {
|
||
|
long x;
|
||
|
|
||
|
prt_err("Touching address %p, 0x%lx\n",
|
||
|
nx_fault_storage_address,
|
||
|
*(long *) nx_fault_storage_address);
|
||
|
x = *(long *) nx_fault_storage_address;
|
||
|
*(long *) nx_fault_storage_address = x;
|
||
|
nx_fault_storage_address = 0;
|
||
|
continue;
|
||
|
} else {
|
||
|
prt_err("wait_for_csb() returns %d\n", ret);
|
||
|
break;
|
||
|
}
|
||
|
} else {
|
||
|
if (i < 10) {
|
||
|
/* spin for few ticks */
|
||
|
#define SPIN_TH 500UL
|
||
|
uint64_t fail_spin;
|
||
|
|
||
|
fail_spin = __ppc_get_timebase();
|
||
|
while ((__ppc_get_timebase() - fail_spin) <
|
||
|
SPIN_TH)
|
||
|
;
|
||
|
} else {
|
||
|
/* sleep */
|
||
|
unsigned int pr = 0;
|
||
|
|
||
|
if (pr++ % 100 == 0) {
|
||
|
prt_err("Paste attempt %d/", i);
|
||
|
prt_err("%d, failed pid= %d\n", retries,
|
||
|
getpid());
|
||
|
}
|
||
|
usleep(1);
|
||
|
}
|
||
|
continue;
|
||
|
}
|
||
|
}
|
||
|
|
||
|
out:
|
||
|
cpu_pri_default();
|
||
|
|
||
|
return ret;
|
||
|
}
|
||
|
|
||
|
int nxu_submit_job(struct nx_gzip_crb_cpb_t *cmdp, void *handle)
|
||
|
{
|
||
|
int cc;
|
||
|
|
||
|
cc = nxu_run_job(cmdp, handle);
|
||
|
|
||
|
if (!cc)
|
||
|
cc = getnn(cmdp->crb.csb, csb_cc); /* CC Table 6-8 */
|
||
|
|
||
|
return cc;
|
||
|
}
|
||
|
|
||
|
|
||
|
void nxu_sigsegv_handler(int sig, siginfo_t *info, void *ctx)
|
||
|
{
|
||
|
fprintf(stderr, "%d: Got signal %d si_code %d, si_addr %p\n", getpid(),
|
||
|
sig, info->si_code, info->si_addr);
|
||
|
|
||
|
nx_fault_storage_address = info->si_addr;
|
||
|
}
|
||
|
|
||
|
/*
|
||
|
* Fault in pages prior to NX job submission. wr=1 may be required to
|
||
|
* touch writeable pages. System zero pages do not fault-in the page as
|
||
|
* intended. Typically set wr=1 for NX target pages and set wr=0 for NX
|
||
|
* source pages.
|
||
|
*/
|
||
|
int nxu_touch_pages(void *buf, long buf_len, long page_len, int wr)
|
||
|
{
|
||
|
char *begin = buf;
|
||
|
char *end = (char *) buf + buf_len - 1;
|
||
|
volatile char t;
|
||
|
|
||
|
assert(buf_len >= 0 && !!buf);
|
||
|
|
||
|
NXPRT(fprintf(stderr, "touch %p %p len 0x%lx wr=%d\n", buf,
|
||
|
(buf + buf_len), buf_len, wr));
|
||
|
|
||
|
if (buf_len <= 0 || buf == NULL)
|
||
|
return -1;
|
||
|
|
||
|
do {
|
||
|
t = *begin;
|
||
|
if (wr)
|
||
|
*begin = t;
|
||
|
begin = begin + page_len;
|
||
|
} while (begin < end);
|
||
|
|
||
|
/* When buf_sz is small or buf tail is in another page */
|
||
|
t = *end;
|
||
|
if (wr)
|
||
|
*end = t;
|
||
|
|
||
|
return 0;
|
||
|
}
|