17c478bd9Sstevel@tonic-gate /* 27c478bd9Sstevel@tonic-gate * CDDL HEADER START 37c478bd9Sstevel@tonic-gate * 47c478bd9Sstevel@tonic-gate * The contents of this file are subject to the terms of the 517169044Sbrutus * Common Development and Distribution License (the "License"). 617169044Sbrutus * You may not use this file except in compliance with the License. 77c478bd9Sstevel@tonic-gate * 87c478bd9Sstevel@tonic-gate * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 97c478bd9Sstevel@tonic-gate * or http://www.opensolaris.org/os/licensing. 107c478bd9Sstevel@tonic-gate * See the License for the specific language governing permissions 117c478bd9Sstevel@tonic-gate * and limitations under the License. 127c478bd9Sstevel@tonic-gate * 137c478bd9Sstevel@tonic-gate * When distributing Covered Code, include this CDDL HEADER in each 147c478bd9Sstevel@tonic-gate * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 157c478bd9Sstevel@tonic-gate * If applicable, add the following below this CDDL HEADER, with the 167c478bd9Sstevel@tonic-gate * fields enclosed by brackets "[]" replaced with your own identifying 177c478bd9Sstevel@tonic-gate * information: Portions Copyright [yyyy] [name of copyright owner] 187c478bd9Sstevel@tonic-gate * 197c478bd9Sstevel@tonic-gate * CDDL HEADER END 207c478bd9Sstevel@tonic-gate */ 217c478bd9Sstevel@tonic-gate /* 2217169044Sbrutus * Copyright 2008 Sun Microsystems, Inc. All rights reserved. 237c478bd9Sstevel@tonic-gate * Use is subject to license terms. 247c478bd9Sstevel@tonic-gate */ 257c478bd9Sstevel@tonic-gate 267c478bd9Sstevel@tonic-gate /* Copyright (c) 1984, 1986, 1987, 1988, 1989 AT&T */ 277c478bd9Sstevel@tonic-gate /* All Rights Reserved */ 287c478bd9Sstevel@tonic-gate 297c478bd9Sstevel@tonic-gate /* 307c478bd9Sstevel@tonic-gate * University Copyright- Copyright (c) 1982, 1986, 1988 317c478bd9Sstevel@tonic-gate * The Regents of the University of California 327c478bd9Sstevel@tonic-gate * All Rights Reserved 337c478bd9Sstevel@tonic-gate * 347c478bd9Sstevel@tonic-gate * University Acknowledgment- Portions of this document are derived from 357c478bd9Sstevel@tonic-gate * software developed by the University of California, Berkeley, and its 367c478bd9Sstevel@tonic-gate * contributors. 377c478bd9Sstevel@tonic-gate */ 387c478bd9Sstevel@tonic-gate 397c478bd9Sstevel@tonic-gate #include <sys/types.h> 407c478bd9Sstevel@tonic-gate #include <sys/sysmacros.h> 417c478bd9Sstevel@tonic-gate #include <sys/param.h> 427c478bd9Sstevel@tonic-gate #include <sys/systm.h> 437c478bd9Sstevel@tonic-gate #include <sys/uio.h> 447c478bd9Sstevel@tonic-gate #include <sys/errno.h> 4517169044Sbrutus #include <sys/vmsystm.h> 4617169044Sbrutus #include <sys/cmn_err.h> 4717169044Sbrutus #include <vm/as.h> 4817169044Sbrutus #include <vm/page.h> 4917169044Sbrutus 5017169044Sbrutus #include <sys/dcopy.h> 5117169044Sbrutus 5217169044Sbrutus int64_t uioa_maxpoll = -1; /* <0 = noblock, 0 = block, >0 = block after */ 5317169044Sbrutus #define UIO_DCOPY_CHANNEL 0 5417169044Sbrutus #define UIO_DCOPY_CMD 1 557c478bd9Sstevel@tonic-gate 567c478bd9Sstevel@tonic-gate /* 577c478bd9Sstevel@tonic-gate * Move "n" bytes at byte address "p"; "rw" indicates the direction 587c478bd9Sstevel@tonic-gate * of the move, and the I/O parameters are provided in "uio", which is 597c478bd9Sstevel@tonic-gate * update to reflect the data which was moved. Returns 0 on success or 607c478bd9Sstevel@tonic-gate * a non-zero errno on failure. 617c478bd9Sstevel@tonic-gate */ 627c478bd9Sstevel@tonic-gate int 637c478bd9Sstevel@tonic-gate uiomove(void *p, size_t n, enum uio_rw rw, struct uio *uio) 647c478bd9Sstevel@tonic-gate { 657c478bd9Sstevel@tonic-gate struct iovec *iov; 667c478bd9Sstevel@tonic-gate ulong_t cnt; 677c478bd9Sstevel@tonic-gate int error; 687c478bd9Sstevel@tonic-gate 697c478bd9Sstevel@tonic-gate while (n && uio->uio_resid) { 707c478bd9Sstevel@tonic-gate iov = uio->uio_iov; 717c478bd9Sstevel@tonic-gate cnt = MIN(iov->iov_len, n); 727c478bd9Sstevel@tonic-gate if (cnt == 0l) { 737c478bd9Sstevel@tonic-gate uio->uio_iov++; 747c478bd9Sstevel@tonic-gate uio->uio_iovcnt--; 757c478bd9Sstevel@tonic-gate continue; 767c478bd9Sstevel@tonic-gate } 777c478bd9Sstevel@tonic-gate switch (uio->uio_segflg) { 787c478bd9Sstevel@tonic-gate 797c478bd9Sstevel@tonic-gate case UIO_USERSPACE: 807c478bd9Sstevel@tonic-gate case UIO_USERISPACE: 817c478bd9Sstevel@tonic-gate if (rw == UIO_READ) { 827c478bd9Sstevel@tonic-gate error = xcopyout_nta(p, iov->iov_base, cnt, 837c478bd9Sstevel@tonic-gate (uio->uio_extflg & UIO_COPY_CACHED)); 847c478bd9Sstevel@tonic-gate } else { 857c478bd9Sstevel@tonic-gate error = xcopyin_nta(iov->iov_base, p, cnt, 867c478bd9Sstevel@tonic-gate (uio->uio_extflg & UIO_COPY_CACHED)); 877c478bd9Sstevel@tonic-gate } 887c478bd9Sstevel@tonic-gate 897c478bd9Sstevel@tonic-gate if (error) 907c478bd9Sstevel@tonic-gate return (error); 917c478bd9Sstevel@tonic-gate break; 927c478bd9Sstevel@tonic-gate 937c478bd9Sstevel@tonic-gate case UIO_SYSSPACE: 947c478bd9Sstevel@tonic-gate if (rw == UIO_READ) 957c478bd9Sstevel@tonic-gate error = kcopy_nta(p, iov->iov_base, cnt, 967c478bd9Sstevel@tonic-gate (uio->uio_extflg & UIO_COPY_CACHED)); 977c478bd9Sstevel@tonic-gate else 987c478bd9Sstevel@tonic-gate error = kcopy_nta(iov->iov_base, p, cnt, 997c478bd9Sstevel@tonic-gate (uio->uio_extflg & UIO_COPY_CACHED)); 1007c478bd9Sstevel@tonic-gate if (error) 1017c478bd9Sstevel@tonic-gate return (error); 1027c478bd9Sstevel@tonic-gate break; 1037c478bd9Sstevel@tonic-gate } 1047c478bd9Sstevel@tonic-gate iov->iov_base += cnt; 1057c478bd9Sstevel@tonic-gate iov->iov_len -= cnt; 1067c478bd9Sstevel@tonic-gate uio->uio_resid -= cnt; 1077c478bd9Sstevel@tonic-gate uio->uio_loffset += cnt; 1087c478bd9Sstevel@tonic-gate p = (caddr_t)p + cnt; 1097c478bd9Sstevel@tonic-gate n -= cnt; 1107c478bd9Sstevel@tonic-gate } 1117c478bd9Sstevel@tonic-gate return (0); 1127c478bd9Sstevel@tonic-gate } 1137c478bd9Sstevel@tonic-gate 1147c478bd9Sstevel@tonic-gate /* 1157c478bd9Sstevel@tonic-gate * transfer a character value into the address space 1167c478bd9Sstevel@tonic-gate * delineated by a uio and update fields within the 1177c478bd9Sstevel@tonic-gate * uio for next character. Return 0 for success, EFAULT 1187c478bd9Sstevel@tonic-gate * for error. 1197c478bd9Sstevel@tonic-gate */ 1207c478bd9Sstevel@tonic-gate int 1217c478bd9Sstevel@tonic-gate ureadc(int val, struct uio *uiop) 1227c478bd9Sstevel@tonic-gate { 1237c478bd9Sstevel@tonic-gate struct iovec *iovp; 1247c478bd9Sstevel@tonic-gate unsigned char c; 1257c478bd9Sstevel@tonic-gate 1267c478bd9Sstevel@tonic-gate /* 1277c478bd9Sstevel@tonic-gate * first determine if uio is valid. uiop should be 1287c478bd9Sstevel@tonic-gate * non-NULL and the resid count > 0. 1297c478bd9Sstevel@tonic-gate */ 1307c478bd9Sstevel@tonic-gate if (!(uiop && uiop->uio_resid > 0)) 1317c478bd9Sstevel@tonic-gate return (EFAULT); 1327c478bd9Sstevel@tonic-gate 1337c478bd9Sstevel@tonic-gate /* 1347c478bd9Sstevel@tonic-gate * scan through iovecs until one is found that is non-empty. 1357c478bd9Sstevel@tonic-gate * Return EFAULT if none found. 1367c478bd9Sstevel@tonic-gate */ 1377c478bd9Sstevel@tonic-gate while (uiop->uio_iovcnt > 0) { 1387c478bd9Sstevel@tonic-gate iovp = uiop->uio_iov; 1397c478bd9Sstevel@tonic-gate if (iovp->iov_len <= 0) { 1407c478bd9Sstevel@tonic-gate uiop->uio_iovcnt--; 1417c478bd9Sstevel@tonic-gate uiop->uio_iov++; 1427c478bd9Sstevel@tonic-gate } else 1437c478bd9Sstevel@tonic-gate break; 1447c478bd9Sstevel@tonic-gate } 1457c478bd9Sstevel@tonic-gate 1467c478bd9Sstevel@tonic-gate if (uiop->uio_iovcnt <= 0) 1477c478bd9Sstevel@tonic-gate return (EFAULT); 1487c478bd9Sstevel@tonic-gate 1497c478bd9Sstevel@tonic-gate /* 1507c478bd9Sstevel@tonic-gate * Transfer character to uio space. 1517c478bd9Sstevel@tonic-gate */ 1527c478bd9Sstevel@tonic-gate 1537c478bd9Sstevel@tonic-gate c = (unsigned char) (val & 0xFF); 1547c478bd9Sstevel@tonic-gate 1557c478bd9Sstevel@tonic-gate switch (uiop->uio_segflg) { 1567c478bd9Sstevel@tonic-gate 1577c478bd9Sstevel@tonic-gate case UIO_USERISPACE: 1587c478bd9Sstevel@tonic-gate case UIO_USERSPACE: 1597c478bd9Sstevel@tonic-gate if (copyout(&c, iovp->iov_base, sizeof (unsigned char))) 1607c478bd9Sstevel@tonic-gate return (EFAULT); 1617c478bd9Sstevel@tonic-gate break; 1627c478bd9Sstevel@tonic-gate 1637c478bd9Sstevel@tonic-gate case UIO_SYSSPACE: /* can do direct copy since kernel-kernel */ 1647c478bd9Sstevel@tonic-gate *iovp->iov_base = c; 1657c478bd9Sstevel@tonic-gate break; 1667c478bd9Sstevel@tonic-gate 1677c478bd9Sstevel@tonic-gate default: 1687c478bd9Sstevel@tonic-gate return (EFAULT); /* invalid segflg value */ 1697c478bd9Sstevel@tonic-gate } 1707c478bd9Sstevel@tonic-gate 1717c478bd9Sstevel@tonic-gate /* 1727c478bd9Sstevel@tonic-gate * bump up/down iovec and uio members to reflect transfer. 1737c478bd9Sstevel@tonic-gate */ 1747c478bd9Sstevel@tonic-gate iovp->iov_base++; 1757c478bd9Sstevel@tonic-gate iovp->iov_len--; 1767c478bd9Sstevel@tonic-gate uiop->uio_resid--; 1777c478bd9Sstevel@tonic-gate uiop->uio_loffset++; 1787c478bd9Sstevel@tonic-gate return (0); /* success */ 1797c478bd9Sstevel@tonic-gate } 1807c478bd9Sstevel@tonic-gate 1817c478bd9Sstevel@tonic-gate /* 1827c478bd9Sstevel@tonic-gate * return a character value from the address space 1837c478bd9Sstevel@tonic-gate * delineated by a uio and update fields within the 1847c478bd9Sstevel@tonic-gate * uio for next character. Return the character for success, 1857c478bd9Sstevel@tonic-gate * -1 for error. 1867c478bd9Sstevel@tonic-gate */ 1877c478bd9Sstevel@tonic-gate int 1887c478bd9Sstevel@tonic-gate uwritec(struct uio *uiop) 1897c478bd9Sstevel@tonic-gate { 1907c478bd9Sstevel@tonic-gate struct iovec *iovp; 1917c478bd9Sstevel@tonic-gate unsigned char c; 1927c478bd9Sstevel@tonic-gate 1937c478bd9Sstevel@tonic-gate /* 1947c478bd9Sstevel@tonic-gate * verify we were passed a valid uio structure. 1957c478bd9Sstevel@tonic-gate * (1) non-NULL uiop, (2) positive resid count 1967c478bd9Sstevel@tonic-gate * (3) there is an iovec with positive length 1977c478bd9Sstevel@tonic-gate */ 1987c478bd9Sstevel@tonic-gate 1997c478bd9Sstevel@tonic-gate if (!(uiop && uiop->uio_resid > 0)) 2007c478bd9Sstevel@tonic-gate return (-1); 2017c478bd9Sstevel@tonic-gate 2027c478bd9Sstevel@tonic-gate while (uiop->uio_iovcnt > 0) { 2037c478bd9Sstevel@tonic-gate iovp = uiop->uio_iov; 2047c478bd9Sstevel@tonic-gate if (iovp->iov_len <= 0) { 2057c478bd9Sstevel@tonic-gate uiop->uio_iovcnt--; 2067c478bd9Sstevel@tonic-gate uiop->uio_iov++; 2077c478bd9Sstevel@tonic-gate } else 2087c478bd9Sstevel@tonic-gate break; 2097c478bd9Sstevel@tonic-gate } 2107c478bd9Sstevel@tonic-gate 2117c478bd9Sstevel@tonic-gate if (uiop->uio_iovcnt <= 0) 2127c478bd9Sstevel@tonic-gate return (-1); 2137c478bd9Sstevel@tonic-gate 2147c478bd9Sstevel@tonic-gate /* 2157c478bd9Sstevel@tonic-gate * Get the character from the uio address space. 2167c478bd9Sstevel@tonic-gate */ 2177c478bd9Sstevel@tonic-gate switch (uiop->uio_segflg) { 2187c478bd9Sstevel@tonic-gate 2197c478bd9Sstevel@tonic-gate case UIO_USERISPACE: 2207c478bd9Sstevel@tonic-gate case UIO_USERSPACE: 2217c478bd9Sstevel@tonic-gate if (copyin(iovp->iov_base, &c, sizeof (unsigned char))) 2227c478bd9Sstevel@tonic-gate return (-1); 2237c478bd9Sstevel@tonic-gate break; 2247c478bd9Sstevel@tonic-gate 2257c478bd9Sstevel@tonic-gate case UIO_SYSSPACE: 2267c478bd9Sstevel@tonic-gate c = *iovp->iov_base; 2277c478bd9Sstevel@tonic-gate break; 2287c478bd9Sstevel@tonic-gate 2297c478bd9Sstevel@tonic-gate default: 2307c478bd9Sstevel@tonic-gate return (-1); /* invalid segflg */ 2317c478bd9Sstevel@tonic-gate } 2327c478bd9Sstevel@tonic-gate 2337c478bd9Sstevel@tonic-gate /* 2347c478bd9Sstevel@tonic-gate * Adjust fields of iovec and uio appropriately. 2357c478bd9Sstevel@tonic-gate */ 2367c478bd9Sstevel@tonic-gate iovp->iov_base++; 2377c478bd9Sstevel@tonic-gate iovp->iov_len--; 2387c478bd9Sstevel@tonic-gate uiop->uio_resid--; 2397c478bd9Sstevel@tonic-gate uiop->uio_loffset++; 2407c478bd9Sstevel@tonic-gate return ((int)c & 0xFF); /* success */ 2417c478bd9Sstevel@tonic-gate } 2427c478bd9Sstevel@tonic-gate 2437c478bd9Sstevel@tonic-gate /* 2447c478bd9Sstevel@tonic-gate * Drop the next n chars out of *uiop. 2457c478bd9Sstevel@tonic-gate */ 2467c478bd9Sstevel@tonic-gate void 2477c478bd9Sstevel@tonic-gate uioskip(uio_t *uiop, size_t n) 2487c478bd9Sstevel@tonic-gate { 2497c478bd9Sstevel@tonic-gate if (n > uiop->uio_resid) 2507c478bd9Sstevel@tonic-gate return; 2517c478bd9Sstevel@tonic-gate while (n != 0) { 2527c478bd9Sstevel@tonic-gate register iovec_t *iovp = uiop->uio_iov; 2537c478bd9Sstevel@tonic-gate register size_t niovb = MIN(iovp->iov_len, n); 2547c478bd9Sstevel@tonic-gate 2557c478bd9Sstevel@tonic-gate if (niovb == 0) { 2567c478bd9Sstevel@tonic-gate uiop->uio_iov++; 2577c478bd9Sstevel@tonic-gate uiop->uio_iovcnt--; 2587c478bd9Sstevel@tonic-gate continue; 2597c478bd9Sstevel@tonic-gate } 2607c478bd9Sstevel@tonic-gate iovp->iov_base += niovb; 2617c478bd9Sstevel@tonic-gate uiop->uio_loffset += niovb; 2627c478bd9Sstevel@tonic-gate iovp->iov_len -= niovb; 2637c478bd9Sstevel@tonic-gate uiop->uio_resid -= niovb; 2647c478bd9Sstevel@tonic-gate n -= niovb; 2657c478bd9Sstevel@tonic-gate } 2667c478bd9Sstevel@tonic-gate } 2677c478bd9Sstevel@tonic-gate 2687c478bd9Sstevel@tonic-gate /* 2697c478bd9Sstevel@tonic-gate * Dup the suio into the duio and diovec of size diov_cnt. If diov 2707c478bd9Sstevel@tonic-gate * is too small to dup suio then an error will be returned, else 0. 2717c478bd9Sstevel@tonic-gate */ 2727c478bd9Sstevel@tonic-gate int 2737c478bd9Sstevel@tonic-gate uiodup(uio_t *suio, uio_t *duio, iovec_t *diov, int diov_cnt) 2747c478bd9Sstevel@tonic-gate { 2757c478bd9Sstevel@tonic-gate int ix; 2767c478bd9Sstevel@tonic-gate iovec_t *siov = suio->uio_iov; 2777c478bd9Sstevel@tonic-gate 2787c478bd9Sstevel@tonic-gate *duio = *suio; 2797c478bd9Sstevel@tonic-gate for (ix = 0; ix < suio->uio_iovcnt; ix++) { 2807c478bd9Sstevel@tonic-gate diov[ix] = siov[ix]; 2817c478bd9Sstevel@tonic-gate if (ix >= diov_cnt) 2827c478bd9Sstevel@tonic-gate return (1); 2837c478bd9Sstevel@tonic-gate } 2847c478bd9Sstevel@tonic-gate duio->uio_iov = diov; 2857c478bd9Sstevel@tonic-gate return (0); 2867c478bd9Sstevel@tonic-gate } 28717169044Sbrutus 28817169044Sbrutus /* 28917169044Sbrutus * Shadow state for checking if a platform has hardware asynchronous 29017169044Sbrutus * copy capability and minimum copy size, e.g. Intel's I/OAT dma engine, 29117169044Sbrutus * 29217169044Sbrutus * Dcopy does a call-back to uioa_dcopy_enable() when a dma device calls 29317169044Sbrutus * into dcopy to register and uioa_dcopy_disable() when the device calls 29417169044Sbrutus * into dcopy to unregister. 29517169044Sbrutus */ 29617169044Sbrutus uioasync_t uioasync = {B_FALSE, 1024}; 29717169044Sbrutus 29817169044Sbrutus void 29917169044Sbrutus uioa_dcopy_enable() 30017169044Sbrutus { 30117169044Sbrutus uioasync.enabled = B_TRUE; 30217169044Sbrutus } 30317169044Sbrutus 30417169044Sbrutus void 30517169044Sbrutus uioa_dcopy_disable() 30617169044Sbrutus { 30717169044Sbrutus uioasync.enabled = B_FALSE; 30817169044Sbrutus } 30917169044Sbrutus 31017169044Sbrutus /* 31117169044Sbrutus * Schedule an asynchronous move of "n" bytes at byte address "p", 31217169044Sbrutus * "rw" indicates the direction of the move, I/O parameters and 31317169044Sbrutus * async state are provided in "uioa" which is update to reflect 31417169044Sbrutus * the data which is to be moved. 31517169044Sbrutus * 31617169044Sbrutus * Returns 0 on success or a non-zero errno on failure. 31717169044Sbrutus * 31817169044Sbrutus * Note, while the uioasync APIs are general purpose in design 31917169044Sbrutus * the current implementation is Intel I/OAT specific. 32017169044Sbrutus */ 32117169044Sbrutus int 32217169044Sbrutus uioamove(void *p, size_t n, enum uio_rw rw, uioa_t *uioa) 32317169044Sbrutus { 32417169044Sbrutus int soff, doff; 32517169044Sbrutus uint64_t pa; 32617169044Sbrutus int cnt; 32717169044Sbrutus iovec_t *iov; 32817169044Sbrutus dcopy_handle_t channel; 32917169044Sbrutus dcopy_cmd_t cmd; 33017169044Sbrutus int ret = 0; 33117169044Sbrutus int dcopy_flags; 33217169044Sbrutus 33317169044Sbrutus if (!(uioa->uioa_state & UIOA_ENABLED)) { 33417169044Sbrutus /* The uioa_t isn't enabled */ 33517169044Sbrutus return (ENXIO); 33617169044Sbrutus } 33717169044Sbrutus 33817169044Sbrutus if (uioa->uio_segflg != UIO_USERSPACE || rw != UIO_READ) { 33917169044Sbrutus /* Only support to user-land from kernel */ 34017169044Sbrutus return (ENOTSUP); 34117169044Sbrutus } 34217169044Sbrutus 34317169044Sbrutus 34417169044Sbrutus channel = uioa->uioa_hwst[UIO_DCOPY_CHANNEL]; 34517169044Sbrutus cmd = uioa->uioa_hwst[UIO_DCOPY_CMD]; 34617169044Sbrutus dcopy_flags = DCOPY_NOSLEEP; 34717169044Sbrutus 34817169044Sbrutus /* 34917169044Sbrutus * While source bytes and destination bytes. 35017169044Sbrutus */ 35117169044Sbrutus while (n > 0 && uioa->uio_resid > 0) { 35217169044Sbrutus iov = uioa->uio_iov; 35317169044Sbrutus if (iov->iov_len == 0l) { 35417169044Sbrutus uioa->uio_iov++; 35517169044Sbrutus uioa->uio_iovcnt--; 35617169044Sbrutus uioa->uioa_lcur++; 35717169044Sbrutus uioa->uioa_lppp = uioa->uioa_lcur->uioa_ppp; 35817169044Sbrutus continue; 35917169044Sbrutus } 36017169044Sbrutus /* 36117169044Sbrutus * While source bytes schedule an async 36217169044Sbrutus * dma for destination page by page. 36317169044Sbrutus */ 36417169044Sbrutus while (n > 0) { 36517169044Sbrutus /* Addr offset in page src/dst */ 36617169044Sbrutus soff = (uintptr_t)p & PAGEOFFSET; 36717169044Sbrutus doff = (uintptr_t)iov->iov_base & PAGEOFFSET; 36817169044Sbrutus /* Min copy count src and dst and page sized */ 36917169044Sbrutus cnt = MIN(n, iov->iov_len); 37017169044Sbrutus cnt = MIN(cnt, PAGESIZE - soff); 37117169044Sbrutus cnt = MIN(cnt, PAGESIZE - doff); 37217169044Sbrutus /* XXX if next page(s) contiguous could use multipage */ 37317169044Sbrutus 37417169044Sbrutus /* 37517169044Sbrutus * if we have an old command, we want to link all 37617169044Sbrutus * other commands to the next command we alloced so 37717169044Sbrutus * we only need to track the last command but can 37817169044Sbrutus * still free them all. 37917169044Sbrutus */ 38017169044Sbrutus if (cmd != NULL) { 38117169044Sbrutus dcopy_flags |= DCOPY_ALLOC_LINK; 38217169044Sbrutus } 38317169044Sbrutus ret = dcopy_cmd_alloc(channel, dcopy_flags, &cmd); 38417169044Sbrutus if (ret != DCOPY_SUCCESS) { 38517169044Sbrutus /* Error of some sort */ 38617169044Sbrutus return (EIO); 38717169044Sbrutus } 38817169044Sbrutus uioa->uioa_hwst[UIO_DCOPY_CMD] = cmd; 38917169044Sbrutus 39017169044Sbrutus ASSERT(cmd->dp_version == DCOPY_CMD_V0); 39117169044Sbrutus if (uioa_maxpoll >= 0) { 39217169044Sbrutus /* Blocking (>0 may be) used in uioafini() */ 39317169044Sbrutus cmd->dp_flags = DCOPY_CMD_INTR; 39417169044Sbrutus } else { 39517169044Sbrutus /* Non blocking uioafini() so no intr */ 39617169044Sbrutus cmd->dp_flags = DCOPY_CMD_NOFLAGS; 39717169044Sbrutus } 39817169044Sbrutus cmd->dp_cmd = DCOPY_CMD_COPY; 39917169044Sbrutus pa = ptob((uint64_t)hat_getpfnum(kas.a_hat, p)); 40017169044Sbrutus cmd->dp.copy.cc_source = pa + soff; 40117169044Sbrutus if (uioa->uioa_lcur->uioa_pfncnt == 0) { 40217169044Sbrutus /* Have a (page_t **) */ 40317169044Sbrutus pa = ptob((uint64_t)( 40417169044Sbrutus *(page_t **)uioa->uioa_lppp)->p_pagenum); 40517169044Sbrutus } else { 40617169044Sbrutus /* Have a (pfn_t *) */ 40717169044Sbrutus pa = ptob((uint64_t)( 40817169044Sbrutus *(pfn_t *)uioa->uioa_lppp)); 40917169044Sbrutus } 41017169044Sbrutus cmd->dp.copy.cc_dest = pa + doff; 41117169044Sbrutus cmd->dp.copy.cc_size = cnt; 41217169044Sbrutus ret = dcopy_cmd_post(cmd); 41317169044Sbrutus if (ret != DCOPY_SUCCESS) { 41417169044Sbrutus /* Error of some sort */ 41517169044Sbrutus return (EIO); 41617169044Sbrutus } 41717169044Sbrutus ret = 0; 41817169044Sbrutus 41917169044Sbrutus /* If UIOA_POLL not set, set it */ 42017169044Sbrutus if (!(uioa->uioa_state & UIOA_POLL)) 42117169044Sbrutus uioa->uioa_state |= UIOA_POLL; 42217169044Sbrutus 42317169044Sbrutus /* Update iov, uio, and local pointers/counters */ 42417169044Sbrutus iov->iov_base += cnt; 42517169044Sbrutus iov->iov_len -= cnt; 42617169044Sbrutus uioa->uio_resid -= cnt; 427*96e0e3daSYu Xiangning uioa->uioa_mbytes += cnt; 42817169044Sbrutus uioa->uio_loffset += cnt; 42917169044Sbrutus p = (caddr_t)p + cnt; 43017169044Sbrutus n -= cnt; 43117169044Sbrutus 43217169044Sbrutus /* End of iovec? */ 43317169044Sbrutus if (iov->iov_len == 0) { 43417169044Sbrutus /* Yup, next iovec */ 43517169044Sbrutus break; 43617169044Sbrutus } 43717169044Sbrutus 43817169044Sbrutus /* Next dst addr page? */ 43917169044Sbrutus if (doff + cnt == PAGESIZE) { 44017169044Sbrutus /* Yup, next page_t */ 44117169044Sbrutus uioa->uioa_lppp++; 44217169044Sbrutus } 44317169044Sbrutus } 44417169044Sbrutus } 44517169044Sbrutus 44617169044Sbrutus return (ret); 44717169044Sbrutus } 44817169044Sbrutus 44917169044Sbrutus /* 45017169044Sbrutus * Initialize a uioa_t for a given uio_t for the current user context, 45117169044Sbrutus * copy the common uio_t to the uioa_t, walk the shared iovec_t and 45217169044Sbrutus * lock down the user-land page(s) containing iovec_t data, then mapin 45317169044Sbrutus * user-land pages using segkpm. 45417169044Sbrutus */ 45517169044Sbrutus int 45617169044Sbrutus uioainit(uio_t *uiop, uioa_t *uioap) 45717169044Sbrutus { 45817169044Sbrutus caddr_t addr; 45917169044Sbrutus page_t **pages; 46017169044Sbrutus int off; 46117169044Sbrutus int len; 46217169044Sbrutus proc_t *procp = ttoproc(curthread); 46317169044Sbrutus struct as *as = procp->p_as; 46417169044Sbrutus iovec_t *iov = uiop->uio_iov; 46517169044Sbrutus int32_t iovcnt = uiop->uio_iovcnt; 46617169044Sbrutus uioa_page_t *locked = uioap->uioa_locked; 46717169044Sbrutus dcopy_handle_t channel; 46817169044Sbrutus int error; 46917169044Sbrutus 47017169044Sbrutus if (! (uioap->uioa_state & UIOA_ALLOC)) { 47117169044Sbrutus /* Can only init() a freshly allocated uioa_t */ 47217169044Sbrutus return (EINVAL); 47317169044Sbrutus } 47417169044Sbrutus 47517169044Sbrutus error = dcopy_alloc(DCOPY_NOSLEEP, &channel); 47617169044Sbrutus if (error == DCOPY_NORESOURCES) { 47717169044Sbrutus /* Turn off uioa */ 47817169044Sbrutus uioasync.enabled = B_FALSE; 47917169044Sbrutus return (ENODEV); 48017169044Sbrutus } 48117169044Sbrutus if (error != DCOPY_SUCCESS) { 48217169044Sbrutus /* Alloc failed */ 48317169044Sbrutus return (EIO); 48417169044Sbrutus } 48517169044Sbrutus 48617169044Sbrutus uioap->uioa_hwst[UIO_DCOPY_CHANNEL] = channel; 48717169044Sbrutus uioap->uioa_hwst[UIO_DCOPY_CMD] = NULL; 48817169044Sbrutus 48917169044Sbrutus /* Indicate uioa_t (will be) initialized */ 49017169044Sbrutus uioap->uioa_state = UIOA_INIT; 49117169044Sbrutus 492*96e0e3daSYu Xiangning uioap->uioa_mbytes = 0; 493*96e0e3daSYu Xiangning 494*96e0e3daSYu Xiangning uioap->uioa_mbytes = 0; 495*96e0e3daSYu Xiangning 49617169044Sbrutus /* uio_t/uioa_t uio_t common struct copy */ 49717169044Sbrutus *((uio_t *)uioap) = *uiop; 49817169044Sbrutus 49917169044Sbrutus /* initialize *uiop->uio_iov */ 50017169044Sbrutus if (iovcnt > UIOA_IOV_MAX) { 50117169044Sbrutus /* Too big? */ 50217169044Sbrutus return (E2BIG); 50317169044Sbrutus } 50417169044Sbrutus uioap->uio_iov = iov; 50517169044Sbrutus uioap->uio_iovcnt = iovcnt; 50617169044Sbrutus 50717169044Sbrutus /* Mark the uioap as such */ 50817169044Sbrutus uioap->uio_extflg |= UIO_ASYNC; 50917169044Sbrutus 51017169044Sbrutus /* 51117169044Sbrutus * For each iovec_t, lock-down the page(s) backing the iovec_t 51217169044Sbrutus * and save the page_t list for phys addr use in uioamove(). 51317169044Sbrutus */ 51417169044Sbrutus iov = uiop->uio_iov; 51517169044Sbrutus iovcnt = uiop->uio_iovcnt; 51617169044Sbrutus while (iovcnt > 0) { 51717169044Sbrutus addr = iov->iov_base; 51817169044Sbrutus off = (uintptr_t)addr & PAGEOFFSET; 51917169044Sbrutus addr = (caddr_t)((uintptr_t)addr & (uintptr_t)PAGEMASK); 52017169044Sbrutus len = iov->iov_len + off; 52117169044Sbrutus 52217169044Sbrutus /* Lock down page(s) for the iov span */ 52317169044Sbrutus if ((error = as_pagelock(as, &pages, 52417169044Sbrutus iov->iov_base, iov->iov_len, S_WRITE)) != 0) { 52517169044Sbrutus /* Error */ 52617169044Sbrutus goto cleanup; 52717169044Sbrutus } 52817169044Sbrutus 52917169044Sbrutus if (pages == NULL) { 53017169044Sbrutus /* 53117169044Sbrutus * Need page_t list, really only need 53217169044Sbrutus * a pfn list so build one. 53317169044Sbrutus */ 53417169044Sbrutus pfn_t *pfnp; 53517169044Sbrutus int pcnt = len >> PAGESHIFT; 53617169044Sbrutus 53717169044Sbrutus if (off) 53817169044Sbrutus pcnt++; 53917169044Sbrutus if ((pfnp = kmem_alloc(pcnt * sizeof (pfnp), 54017169044Sbrutus KM_NOSLEEP)) == NULL) { 54117169044Sbrutus error = ENOMEM; 54217169044Sbrutus goto cleanup; 54317169044Sbrutus } 54417169044Sbrutus locked->uioa_ppp = (void **)pfnp; 54517169044Sbrutus locked->uioa_pfncnt = pcnt; 54617169044Sbrutus AS_LOCK_ENTER(as, &as->a_lock, RW_READER); 54717169044Sbrutus while (pcnt-- > 0) { 54817169044Sbrutus *pfnp++ = hat_getpfnum(as->a_hat, addr); 54917169044Sbrutus addr += PAGESIZE; 55017169044Sbrutus } 55117169044Sbrutus AS_LOCK_EXIT(as, &as->a_lock); 55217169044Sbrutus } else { 55317169044Sbrutus /* Have a page_t list, save it */ 55417169044Sbrutus locked->uioa_ppp = (void **)pages; 55517169044Sbrutus locked->uioa_pfncnt = 0; 55617169044Sbrutus } 55717169044Sbrutus /* Save for as_pageunlock() in uioafini() */ 55817169044Sbrutus locked->uioa_base = iov->iov_base; 55917169044Sbrutus locked->uioa_len = iov->iov_len; 56017169044Sbrutus locked++; 56117169044Sbrutus 56217169044Sbrutus /* Next iovec_t */ 56317169044Sbrutus iov++; 56417169044Sbrutus iovcnt--; 56517169044Sbrutus } 56617169044Sbrutus /* Initialize curret pointer into uioa_locked[] and it's uioa_ppp */ 56717169044Sbrutus uioap->uioa_lcur = uioap->uioa_locked; 56817169044Sbrutus uioap->uioa_lppp = uioap->uioa_lcur->uioa_ppp; 56917169044Sbrutus return (0); 57017169044Sbrutus 57117169044Sbrutus cleanup: 57217169044Sbrutus /* Unlock any previously locked page_t(s) */ 57317169044Sbrutus while (locked > uioap->uioa_locked) { 57417169044Sbrutus locked--; 57517169044Sbrutus as_pageunlock(as, (page_t **)locked->uioa_ppp, 57617169044Sbrutus locked->uioa_base, locked->uioa_len, S_WRITE); 57717169044Sbrutus } 57817169044Sbrutus 57917169044Sbrutus /* Last indicate uioa_t still in alloc state */ 58017169044Sbrutus uioap->uioa_state = UIOA_ALLOC; 581*96e0e3daSYu Xiangning uioap->uioa_mbytes = 0; 58217169044Sbrutus 58317169044Sbrutus return (error); 58417169044Sbrutus } 58517169044Sbrutus 58617169044Sbrutus /* 58717169044Sbrutus * Finish processing of a uioa_t by cleanup any pending "uioap" actions. 58817169044Sbrutus */ 58917169044Sbrutus int 59017169044Sbrutus uioafini(uio_t *uiop, uioa_t *uioap) 59117169044Sbrutus { 59217169044Sbrutus int32_t iovcnt = uiop->uio_iovcnt; 59317169044Sbrutus uioa_page_t *locked = uioap->uioa_locked; 59417169044Sbrutus struct as *as = ttoproc(curthread)->p_as; 59517169044Sbrutus dcopy_handle_t channel; 59617169044Sbrutus dcopy_cmd_t cmd; 59717169044Sbrutus int ret = 0; 59817169044Sbrutus 59917169044Sbrutus ASSERT(uioap->uio_extflg & UIO_ASYNC); 60017169044Sbrutus 60117169044Sbrutus if (!(uioap->uioa_state & (UIOA_ENABLED|UIOA_FINI))) { 60217169044Sbrutus /* Must be an active uioa_t */ 60317169044Sbrutus return (EINVAL); 60417169044Sbrutus } 60517169044Sbrutus 60617169044Sbrutus channel = uioap->uioa_hwst[UIO_DCOPY_CHANNEL]; 60717169044Sbrutus cmd = uioap->uioa_hwst[UIO_DCOPY_CMD]; 60817169044Sbrutus 60917169044Sbrutus /* XXX - why do we get cmd == NULL sometimes? */ 61017169044Sbrutus if (cmd != NULL) { 61117169044Sbrutus if (uioap->uioa_state & UIOA_POLL) { 61217169044Sbrutus /* Wait for last dcopy() to finish */ 61317169044Sbrutus int64_t poll = 1; 61417169044Sbrutus int poll_flag = DCOPY_POLL_NOFLAGS; 61517169044Sbrutus 61617169044Sbrutus do { 61717169044Sbrutus if (uioa_maxpoll == 0 || 61817169044Sbrutus (uioa_maxpoll > 0 && 61917169044Sbrutus poll >= uioa_maxpoll)) { 62017169044Sbrutus /* Always block or after maxpoll */ 62117169044Sbrutus poll_flag = DCOPY_POLL_BLOCK; 62217169044Sbrutus } else { 62317169044Sbrutus /* No block, poll */ 62417169044Sbrutus poll++; 62517169044Sbrutus } 62617169044Sbrutus ret = dcopy_cmd_poll(cmd, poll_flag); 62717169044Sbrutus } while (ret == DCOPY_PENDING); 62817169044Sbrutus 62917169044Sbrutus if (ret == DCOPY_COMPLETED) { 63017169044Sbrutus /* Poll/block succeeded */ 63117169044Sbrutus ret = 0; 63217169044Sbrutus } else { 63317169044Sbrutus /* Poll/block failed */ 63417169044Sbrutus ret = EIO; 63517169044Sbrutus } 63617169044Sbrutus } 63717169044Sbrutus dcopy_cmd_free(&cmd); 63817169044Sbrutus } 63917169044Sbrutus 64017169044Sbrutus dcopy_free(&channel); 64117169044Sbrutus 64217169044Sbrutus /* Unlock all page(s) iovec_t by iovec_t */ 64317169044Sbrutus while (iovcnt-- > 0) { 64417169044Sbrutus page_t **pages; 64517169044Sbrutus 64617169044Sbrutus if (locked->uioa_pfncnt == 0) { 64717169044Sbrutus /* A as_pagelock() returned (page_t **) */ 64817169044Sbrutus pages = (page_t **)locked->uioa_ppp; 64917169044Sbrutus } else { 65017169044Sbrutus /* Our pfn_t array */ 65117169044Sbrutus pages = NULL; 65217169044Sbrutus kmem_free(locked->uioa_ppp, locked->uioa_pfncnt * 65317169044Sbrutus sizeof (pfn_t *)); 65417169044Sbrutus } 65517169044Sbrutus as_pageunlock(as, pages, locked->uioa_base, locked->uioa_len, 65617169044Sbrutus S_WRITE); 65717169044Sbrutus 65817169044Sbrutus locked++; 65917169044Sbrutus } 66017169044Sbrutus /* uioa_t->uio_t common struct copy */ 66117169044Sbrutus *uiop = *((uio_t *)uioap); 66217169044Sbrutus 66317169044Sbrutus /* 66417169044Sbrutus * Last, reset uioa state to alloc. 66517169044Sbrutus * 66617169044Sbrutus * Note, we only initialize the state here, all other members 66717169044Sbrutus * will be initialized in a subsequent uioainit(). 66817169044Sbrutus */ 66917169044Sbrutus uioap->uioa_state = UIOA_ALLOC; 670*96e0e3daSYu Xiangning uioap->uioa_mbytes = 0; 67117169044Sbrutus 67217169044Sbrutus uioap->uioa_hwst[UIO_DCOPY_CMD] = NULL; 67317169044Sbrutus uioap->uioa_hwst[UIO_DCOPY_CHANNEL] = NULL; 67417169044Sbrutus 67517169044Sbrutus return (ret); 67617169044Sbrutus } 677