11ae08745Sheppo /* 21ae08745Sheppo * CDDL HEADER START 31ae08745Sheppo * 41ae08745Sheppo * The contents of this file are subject to the terms of the 51ae08745Sheppo * Common Development and Distribution License (the "License"). 61ae08745Sheppo * You may not use this file except in compliance with the License. 71ae08745Sheppo * 81ae08745Sheppo * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE 91ae08745Sheppo * or http://www.opensolaris.org/os/licensing. 101ae08745Sheppo * See the License for the specific language governing permissions 111ae08745Sheppo * and limitations under the License. 121ae08745Sheppo * 131ae08745Sheppo * When distributing Covered Code, include this CDDL HEADER in each 141ae08745Sheppo * file and include the License file at usr/src/OPENSOLARIS.LICENSE. 151ae08745Sheppo * If applicable, add the following below this CDDL HEADER, with the 161ae08745Sheppo * fields enclosed by brackets "[]" replaced with your own identifying 171ae08745Sheppo * information: Portions Copyright [yyyy] [name of copyright owner] 181ae08745Sheppo * 191ae08745Sheppo * CDDL HEADER END 201ae08745Sheppo */ 211ae08745Sheppo 221ae08745Sheppo /* 23655fd6a9Sachartre * Copyright 2007 Sun Microsystems, Inc. All rights reserved. 241ae08745Sheppo * Use is subject to license terms. 251ae08745Sheppo */ 261ae08745Sheppo 271ae08745Sheppo #ifndef _VDC_H 281ae08745Sheppo #define _VDC_H 291ae08745Sheppo 301ae08745Sheppo #pragma ident "%Z%%M% %I% %E% SMI" 311ae08745Sheppo 321ae08745Sheppo /* 331ae08745Sheppo * Virtual disk client implementation definitions 341ae08745Sheppo */ 351ae08745Sheppo 361ae08745Sheppo #include <sys/sysmacros.h> 371ae08745Sheppo #include <sys/note.h> 381ae08745Sheppo 391ae08745Sheppo #include <sys/ldc.h> 401ae08745Sheppo #include <sys/vio_mailbox.h> 411ae08745Sheppo #include <sys/vdsk_mailbox.h> 421ae08745Sheppo #include <sys/vdsk_common.h> 431ae08745Sheppo 441ae08745Sheppo #ifdef __cplusplus 451ae08745Sheppo extern "C" { 461ae08745Sheppo #endif 471ae08745Sheppo 481ae08745Sheppo #define VDC_DRIVER_NAME "vdc" 491ae08745Sheppo 501ae08745Sheppo /* 511ae08745Sheppo * Bit-field values to indicate if parts of the vdc driver are initialised. 521ae08745Sheppo */ 531ae08745Sheppo #define VDC_SOFT_STATE 0x0001 541ae08745Sheppo #define VDC_LOCKS 0x0002 551ae08745Sheppo #define VDC_MINOR 0x0004 561ae08745Sheppo #define VDC_THREAD 0x0008 571ae08745Sheppo #define VDC_LDC 0x0010 581ae08745Sheppo #define VDC_LDC_INIT 0x0020 591ae08745Sheppo #define VDC_LDC_CB 0x0040 601ae08745Sheppo #define VDC_LDC_OPEN 0x0080 611ae08745Sheppo #define VDC_DRING_INIT 0x0100 /* The DRing was created */ 621ae08745Sheppo #define VDC_DRING_BOUND 0x0200 /* The DRing was bound to an LDC channel */ 631ae08745Sheppo #define VDC_DRING_LOCAL 0x0400 /* The local private DRing was allocated */ 641ae08745Sheppo #define VDC_DRING_ENTRY 0x0800 /* At least one DRing entry was initialised */ 651ae08745Sheppo #define VDC_DRING (VDC_DRING_INIT | VDC_DRING_BOUND | \ 661ae08745Sheppo VDC_DRING_LOCAL | VDC_DRING_ENTRY) 671ae08745Sheppo #define VDC_HANDSHAKE 0x1000 /* Indicates if a handshake is in progress */ 681ae08745Sheppo #define VDC_HANDSHAKE_STOP 0x2000 /* stop further handshakes */ 691ae08745Sheppo 701ae08745Sheppo /* 711ae08745Sheppo * Definitions of strings to be used to create device node properties. 721ae08745Sheppo * (vdc uses the capitalised versions of these properties as they are 64-bit) 731ae08745Sheppo */ 741ae08745Sheppo #define VDC_NBLOCKS_PROP_NAME "Nblocks" 751ae08745Sheppo #define VDC_SIZE_PROP_NAME "Size" 761ae08745Sheppo 771ae08745Sheppo /* 781ae08745Sheppo * Definitions of MD nodes/properties. 791ae08745Sheppo */ 801ae08745Sheppo #define VDC_MD_CHAN_NAME "channel-endpoint" 811ae08745Sheppo #define VDC_MD_VDEV_NAME "virtual-device" 82655fd6a9Sachartre #define VDC_MD_PORT_NAME "virtual-device-port" 831ae08745Sheppo #define VDC_MD_DISK_NAME "disk" 841ae08745Sheppo #define VDC_MD_CFG_HDL "cfg-handle" 85655fd6a9Sachartre #define VDC_MD_TIMEOUT "vdc-timeout" 86655fd6a9Sachartre #define VDC_MD_ID "id" 871ae08745Sheppo 881ae08745Sheppo /* 89e1ebb9ecSlm66018 * Definition of actions to be carried out when processing the sequence ID 90e1ebb9ecSlm66018 * of a message received from the vDisk server. The function verifying the 91e1ebb9ecSlm66018 * sequence number checks the 'seq_num_xxx' fields in the soft state and 92e1ebb9ecSlm66018 * returns whether the message should be processed (VDC_SEQ_NUM_TODO) or 93e1ebb9ecSlm66018 * whether it was it was previously processed (VDC_SEQ_NUM_SKIP). 94e1ebb9ecSlm66018 */ 95e1ebb9ecSlm66018 #define VDC_SEQ_NUM_INVALID -1 /* Error */ 96e1ebb9ecSlm66018 #define VDC_SEQ_NUM_SKIP 0 /* Request already processed */ 97e1ebb9ecSlm66018 #define VDC_SEQ_NUM_TODO 1 /* Request needs processing */ 98e1ebb9ecSlm66018 99e1ebb9ecSlm66018 /* 1000d0c8d4bSnarayan * Macros to get UNIT and PART number 1011ae08745Sheppo */ 1020d0c8d4bSnarayan #define VDCUNIT_SHIFT 3 1030d0c8d4bSnarayan #define VDCPART_MASK 7 1040d0c8d4bSnarayan 1050d0c8d4bSnarayan #define VDCUNIT(dev) (getminor((dev)) >> VDCUNIT_SHIFT) 1060d0c8d4bSnarayan #define VDCPART(dev) (getminor((dev)) & VDCPART_MASK) 1070d0c8d4bSnarayan 1080d0c8d4bSnarayan /* 1090d0c8d4bSnarayan * Scheme to store the instance number and the slice number in the minor number. 1100d0c8d4bSnarayan * (NOTE: Uses the same format and definitions as the sd(7D) driver) 1110d0c8d4bSnarayan */ 1120d0c8d4bSnarayan #define VD_MAKE_DEV(instance, minor) ((instance << VDCUNIT_SHIFT) | minor) 1131ae08745Sheppo 1141ae08745Sheppo /* 1151ae08745Sheppo * variables controlling how long to wait before timing out and how many 1161ae08745Sheppo * retries to attempt before giving up when communicating with vds. 117e1ebb9ecSlm66018 * 118e1ebb9ecSlm66018 * These values need to be sufficiently large so that a guest can survive 119e1ebb9ecSlm66018 * the reboot of the service domain. 1201ae08745Sheppo */ 121e1ebb9ecSlm66018 #define VDC_RETRIES 10 1221ae08745Sheppo 1231ae08745Sheppo #define VDC_USEC_TIMEOUT_MIN (30 * MICROSEC) /* 30 sec */ 1241ae08745Sheppo 125e1ebb9ecSlm66018 /* 126e1ebb9ecSlm66018 * This macro returns the number of Hz that the vdc driver should wait before 127e1ebb9ecSlm66018 * a timeout is triggered. The 'timeout' parameter specifiecs the wait 128e1ebb9ecSlm66018 * time in Hz. The 'mul' parameter allows for a multiplier to be 129e1ebb9ecSlm66018 * specified allowing for a backoff to be implemented (e.g. using the 130e1ebb9ecSlm66018 * retry number as a multiplier) where the wait time will get longer if 131e1ebb9ecSlm66018 * there is no response on the previous retry. 132e1ebb9ecSlm66018 */ 133e1ebb9ecSlm66018 #define VD_GET_TIMEOUT_HZ(timeout, mul) \ 134e1ebb9ecSlm66018 (ddi_get_lbolt() + ((timeout) * MAX(1, (mul)))) 1351ae08745Sheppo 1361ae08745Sheppo /* 1371ae08745Sheppo * Macros to manipulate Descriptor Ring variables in the soft state 1381ae08745Sheppo * structure. 1391ae08745Sheppo */ 140e1ebb9ecSlm66018 #define VDC_GET_NEXT_REQ_ID(vdc) ((vdc)->req_id++) 1411ae08745Sheppo 1421ae08745Sheppo #define VDC_GET_DRING_ENTRY_PTR(vdc, idx) \ 143*17cadca8Slm66018 (vd_dring_entry_t *)(uintptr_t)((vdc)->dring_mem_info.vaddr + \ 144e1ebb9ecSlm66018 (idx * (vdc)->dring_entry_size)) 1451ae08745Sheppo 1461ae08745Sheppo #define VDC_MARK_DRING_ENTRY_FREE(vdc, idx) \ 1471ae08745Sheppo { \ 1481ae08745Sheppo vd_dring_entry_t *dep = NULL; \ 1491ae08745Sheppo ASSERT(vdc != NULL); \ 150*17cadca8Slm66018 ASSERT(idx < vdc->dring_len); \ 1511ae08745Sheppo ASSERT(vdc->dring_mem_info.vaddr != NULL); \ 152*17cadca8Slm66018 dep = (vd_dring_entry_t *)(uintptr_t) \ 153*17cadca8Slm66018 (vdc->dring_mem_info.vaddr + \ 1541ae08745Sheppo (idx * vdc->dring_entry_size)); \ 1551ae08745Sheppo ASSERT(dep != NULL); \ 1561ae08745Sheppo dep->hdr.dstate = VIO_DESC_FREE; \ 1571ae08745Sheppo } 1581ae08745Sheppo 1591ae08745Sheppo /* Initialise the Session ID and Sequence Num in the DRing msg */ 1601ae08745Sheppo #define VDC_INIT_DRING_DATA_MSG_IDS(dmsg, vdc) \ 1611ae08745Sheppo ASSERT(vdc != NULL); \ 1621ae08745Sheppo dmsg.tag.vio_sid = vdc->session_id; \ 1630a55fbb7Slm66018 dmsg.seq_num = vdc->seq_num; 1641ae08745Sheppo 1651ae08745Sheppo /* 1663af08d82Slm66018 * The states that the read thread can be in. 1671ae08745Sheppo */ 1683af08d82Slm66018 typedef enum vdc_rd_state { 1693af08d82Slm66018 VDC_READ_IDLE, /* idling - conn is not up */ 1703af08d82Slm66018 VDC_READ_WAITING, /* waiting for data */ 1713af08d82Slm66018 VDC_READ_PENDING, /* pending data avail for read */ 1723af08d82Slm66018 VDC_READ_RESET /* channel was reset - stop reads */ 1733af08d82Slm66018 } vdc_rd_state_t; 1743af08d82Slm66018 1753af08d82Slm66018 /* 1763af08d82Slm66018 * The states that the vdc-vds connection can be in. 1773af08d82Slm66018 */ 1783af08d82Slm66018 typedef enum vdc_state { 1793af08d82Slm66018 VDC_STATE_INIT, /* device is initialized */ 1803af08d82Slm66018 VDC_STATE_INIT_WAITING, /* waiting for ldc connection */ 1813af08d82Slm66018 VDC_STATE_NEGOTIATE, /* doing handshake negotiation */ 1823af08d82Slm66018 VDC_STATE_HANDLE_PENDING, /* handle requests in backup dring */ 1833af08d82Slm66018 VDC_STATE_RUNNING, /* running and accepting requests */ 1843af08d82Slm66018 VDC_STATE_DETACH, /* detaching */ 1853af08d82Slm66018 VDC_STATE_RESETTING /* resetting connection with vds */ 1863af08d82Slm66018 } vdc_state_t; 1873af08d82Slm66018 1883af08d82Slm66018 /* 1893af08d82Slm66018 * The states that the vdc instance can be in. 1903af08d82Slm66018 */ 1913af08d82Slm66018 typedef enum vdc_lc_state { 1923af08d82Slm66018 VDC_LC_ATTACHING, /* driver is attaching */ 1933af08d82Slm66018 VDC_LC_ONLINE, /* driver is attached and online */ 1943af08d82Slm66018 VDC_LC_DETACHING /* driver is detaching */ 1953af08d82Slm66018 } vdc_lc_state_t; 1961ae08745Sheppo 1971ae08745Sheppo /* 1981ae08745Sheppo * Local Descriptor Ring entry 1991ae08745Sheppo * 2001ae08745Sheppo * vdc creates a Local (private) descriptor ring the same size as the 2011ae08745Sheppo * public descriptor ring it exports to vds. 2021ae08745Sheppo */ 2033af08d82Slm66018 2043af08d82Slm66018 typedef enum { 2053af08d82Slm66018 VIO_read_dir, /* read data from server */ 2063af08d82Slm66018 VIO_write_dir, /* write data to server */ 2073af08d82Slm66018 VIO_both_dir /* transfer both in and out in same buffer */ 2083af08d82Slm66018 } vio_desc_direction_t; 2093af08d82Slm66018 2103af08d82Slm66018 typedef enum { 2113af08d82Slm66018 CB_STRATEGY, /* non-blocking strategy call */ 2123af08d82Slm66018 CB_SYNC /* synchronous operation */ 2133af08d82Slm66018 } vio_cb_type_t; 2143af08d82Slm66018 2151ae08745Sheppo typedef struct vdc_local_desc { 2163af08d82Slm66018 boolean_t is_free; /* local state - inuse or not */ 2173af08d82Slm66018 2181ae08745Sheppo int operation; /* VD_OP_xxx to be performed */ 2191ae08745Sheppo caddr_t addr; /* addr passed in by consumer */ 2203af08d82Slm66018 int slice; 2213af08d82Slm66018 diskaddr_t offset; /* disk offset */ 2223af08d82Slm66018 size_t nbytes; 2233af08d82Slm66018 vio_cb_type_t cb_type; /* operation type blk/nonblk */ 2243af08d82Slm66018 void *cb_arg; /* buf passed to strategy() */ 2253af08d82Slm66018 vio_desc_direction_t dir; /* direction of transfer */ 2263af08d82Slm66018 2271ae08745Sheppo caddr_t align_addr; /* used if addr non-aligned */ 2281ae08745Sheppo ldc_mem_handle_t desc_mhdl; /* Mem handle of buf */ 2291ae08745Sheppo vd_dring_entry_t *dep; /* public Dring Entry Pointer */ 2303af08d82Slm66018 2311ae08745Sheppo } vdc_local_desc_t; 2321ae08745Sheppo 2331ae08745Sheppo /* 2341ae08745Sheppo * vdc soft state structure 2351ae08745Sheppo */ 2361ae08745Sheppo typedef struct vdc { 2371ae08745Sheppo 2381ae08745Sheppo kmutex_t lock; /* protects next 2 sections of vars */ 2393af08d82Slm66018 kcondvar_t running_cv; /* signal when upper layers can send */ 2403af08d82Slm66018 kcondvar_t initwait_cv; /* signal when ldc conn is up */ 2413af08d82Slm66018 kcondvar_t dring_free_cv; /* signal when desc is avail */ 2423af08d82Slm66018 kcondvar_t membind_cv; /* signal when mem can be bound */ 2433af08d82Slm66018 boolean_t self_reset; 2441ae08745Sheppo 2451ae08745Sheppo int initialized; /* keeps track of what's init'ed */ 2463af08d82Slm66018 vdc_lc_state_t lifecycle; /* Current state of the vdc instance */ 2473af08d82Slm66018 2480a55fbb7Slm66018 int hshake_cnt; /* number of failed handshakes */ 24978fcd0a1Sachartre uint8_t open[OTYPCNT]; /* mask of opened slices */ 25078fcd0a1Sachartre uint8_t open_excl; /* mask of exclusively opened slices */ 25178fcd0a1Sachartre ulong_t open_lyr[V_NUMPAR]; /* number of layered opens */ 2521ae08745Sheppo int dkio_flush_pending; /* # outstanding DKIO flushes */ 25378fcd0a1Sachartre int validate_pending; /* # outstanding validate request */ 25478fcd0a1Sachartre vd_disk_label_t vdisk_label; /* label type of device/disk imported */ 25578fcd0a1Sachartre struct vtoc *vtoc; /* structure to store VTOC data */ 25678fcd0a1Sachartre struct dk_geom *geom; /* structure to store geometry data */ 2571ae08745Sheppo 2583af08d82Slm66018 kthread_t *msg_proc_thr; /* main msg processing thread */ 2593af08d82Slm66018 2603af08d82Slm66018 kmutex_t read_lock; /* lock to protect read */ 2613af08d82Slm66018 kcondvar_t read_cv; /* cv to wait for READ events */ 2623af08d82Slm66018 vdc_rd_state_t read_state; /* current read state */ 2633af08d82Slm66018 2643af08d82Slm66018 uint32_t sync_op_cnt; /* num of active sync operations */ 2653af08d82Slm66018 boolean_t sync_op_pending; /* sync operation is pending */ 2663af08d82Slm66018 boolean_t sync_op_blocked; /* blocked waiting to do sync op */ 2673af08d82Slm66018 uint32_t sync_op_status; /* status of sync operation */ 2683af08d82Slm66018 kcondvar_t sync_pending_cv; /* cv wait for sync op to finish */ 2693af08d82Slm66018 kcondvar_t sync_blocked_cv; /* cv wait for other syncs to finish */ 2703af08d82Slm66018 2711ae08745Sheppo uint64_t session_id; /* common ID sent with all messages */ 2721ae08745Sheppo uint64_t seq_num; /* most recent sequence num generated */ 2731ae08745Sheppo uint64_t seq_num_reply; /* Last seq num ACK/NACK'ed by vds */ 2741ae08745Sheppo uint64_t req_id; /* Most recent Request ID generated */ 275e1ebb9ecSlm66018 uint64_t req_id_proc; /* Last request ID processed by vdc */ 2763af08d82Slm66018 vdc_state_t state; /* Current disk client-server state */ 277e1ebb9ecSlm66018 278e1ebb9ecSlm66018 dev_info_t *dip; /* device info pointer */ 279e1ebb9ecSlm66018 int instance; /* driver instance number */ 2803af08d82Slm66018 281e1ebb9ecSlm66018 vio_ver_t ver; /* version number agreed with server */ 2821ae08745Sheppo vd_disk_type_t vdisk_type; /* type of device/disk being imported */ 283*17cadca8Slm66018 uint32_t vdisk_media; /* physical media type of vDisk */ 2844bac2208Snarayan uint64_t vdisk_size; /* device size in blocks */ 2851ae08745Sheppo uint64_t max_xfer_sz; /* maximum block size of a descriptor */ 2861ae08745Sheppo uint64_t block_size; /* device block size used */ 287*17cadca8Slm66018 uint64_t operations; /* bitmask of ops. server supports */ 2881ae08745Sheppo struct dk_cinfo *cinfo; /* structure to store DKIOCINFO data */ 2891ae08745Sheppo struct dk_minfo *minfo; /* structure for DKIOCGMEDIAINFO data */ 2904bac2208Snarayan ddi_devid_t devid; /* device id */ 291655fd6a9Sachartre uint64_t ctimeout; /* connection timeout in seconds */ 292655fd6a9Sachartre boolean_t ctimeout_reached; /* connection timeout has expired */ 2931ae08745Sheppo 2943af08d82Slm66018 ldc_mem_info_t dring_mem_info; /* dring information */ 2953af08d82Slm66018 uint_t dring_curr_idx; /* current index */ 2963af08d82Slm66018 uint32_t dring_len; /* dring length */ 2973af08d82Slm66018 uint32_t dring_max_cookies; /* dring max cookies */ 2983af08d82Slm66018 uint32_t dring_cookie_count; /* num cookies */ 2993af08d82Slm66018 uint32_t dring_entry_size; /* descriptor size */ 3003af08d82Slm66018 ldc_mem_cookie_t *dring_cookie; /* dring cookies */ 3013af08d82Slm66018 uint64_t dring_ident; /* dring ident */ 3021ae08745Sheppo 3033af08d82Slm66018 uint64_t threads_pending; /* num of threads */ 3041ae08745Sheppo 3053af08d82Slm66018 vdc_local_desc_t *local_dring; /* local dring */ 3063af08d82Slm66018 vdc_local_desc_t *local_dring_backup; /* local dring backup */ 3073af08d82Slm66018 int local_dring_backup_tail; /* backup dring tail */ 3083af08d82Slm66018 int local_dring_backup_len; /* backup dring len */ 3091ae08745Sheppo 3103af08d82Slm66018 uint64_t ldc_id; /* LDC channel id */ 3113af08d82Slm66018 ldc_status_t ldc_state; /* LDC channel state */ 3123af08d82Slm66018 ldc_handle_t ldc_handle; /* LDC handle */ 3133af08d82Slm66018 ldc_dring_handle_t ldc_dring_hdl; /* LDC dring handle */ 3141ae08745Sheppo } vdc_t; 3151ae08745Sheppo 3161ae08745Sheppo /* 3171ae08745Sheppo * Debugging macros 3181ae08745Sheppo */ 3191ae08745Sheppo #ifdef DEBUG 3201ae08745Sheppo extern int vdc_msglevel; 3213af08d82Slm66018 extern uint64_t vdc_matchinst; 3221ae08745Sheppo 3233af08d82Slm66018 #define DMSG(_vdc, err_level, format, ...) \ 3243af08d82Slm66018 do { \ 3253af08d82Slm66018 if (vdc_msglevel > err_level && \ 3263af08d82Slm66018 (vdc_matchinst & (1ull << (_vdc)->instance))) \ 3273af08d82Slm66018 cmn_err(CE_CONT, "?[%d,t@%p] %s: "format, \ 3283af08d82Slm66018 (_vdc)->instance, (void *)curthread, \ 3293af08d82Slm66018 __func__, __VA_ARGS__); \ 3303af08d82Slm66018 _NOTE(CONSTANTCONDITION) \ 3313af08d82Slm66018 } while (0); 3323af08d82Slm66018 3333af08d82Slm66018 #define DMSGX(err_level, format, ...) \ 334e1ebb9ecSlm66018 do { \ 335e1ebb9ecSlm66018 if (vdc_msglevel > err_level) \ 3363af08d82Slm66018 cmn_err(CE_CONT, "?%s: "format, __func__, __VA_ARGS__);\ 337e1ebb9ecSlm66018 _NOTE(CONSTANTCONDITION) \ 338e1ebb9ecSlm66018 } while (0); 3391ae08745Sheppo 3401ae08745Sheppo #define VDC_DUMP_DRING_MSG(dmsgp) \ 3413af08d82Slm66018 DMSGX(0, "sq:%lu start:%d end:%d ident:%lu\n", \ 3421ae08745Sheppo dmsgp->seq_num, dmsgp->start_idx, \ 3431ae08745Sheppo dmsgp->end_idx, dmsgp->dring_ident); 3441ae08745Sheppo 3451ae08745Sheppo #else /* !DEBUG */ 346e1ebb9ecSlm66018 #define DMSG(err_level, ...) 3473af08d82Slm66018 #define DMSGX(err_level, format, ...) 3481ae08745Sheppo #define VDC_DUMP_DRING_MSG(dmsgp) 3491ae08745Sheppo 3501ae08745Sheppo #endif /* !DEBUG */ 3511ae08745Sheppo 3521ae08745Sheppo #ifdef __cplusplus 3531ae08745Sheppo } 3541ae08745Sheppo #endif 3551ae08745Sheppo 3561ae08745Sheppo #endif /* _VDC_H */ 357