xref: /illumos-gate/usr/src/uts/common/io/fibre-channel/ulp/fcip.c (revision 1ec00b5abd071c76e2dc0cfa7905965b6b7a89a9)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  * Copyright (c) 2016 by Delphix. All rights reserved.
25  */
26 
27 /*
28  * SunOS 5.x Multithreaded STREAMS DLPI FCIP Module
29  * This is a pseudo driver module to handle encapsulation of IP and ARP
30  * datagrams over FibreChannel interfaces. FCIP is a cloneable STREAMS
31  * driver module which interfaces with IP/ARP using DLPI. This module
32  * is a Style-2 DLS provider.
33  *
34  * The implementation of this module is based on RFC 2625 which gives
35  * details on the encapsulation of IP/ARP data over FibreChannel.
36  * The fcip module needs to resolve an IP address to a port address before
37  * sending data to a destination port. A FC device port has 2 addresses
38  * associated with it: A 8 byte World Wide unique Port Name and a 3 byte
39  * volatile Port number or Port_ID.
40  *
41  * The mapping between a IP address and the World Wide Port Name is handled
42  * by the ARP layer since the IP over FC draft requires the MAC address to
43  * be the least significant six bytes of the WorldWide Port Names. The
44  * fcip module however needs to identify the destination port uniquely when
45  * the destination FC device has multiple FC ports.
46  *
47  * The FC layer mapping between the World Wide Port Name and the Port_ID
48  * will be handled through the use of a fabric name server or through the
49  * use of the FARP ELS command as described in the draft. Since the Port_IDs
50  * are volatile, the mapping between the World Wide Port Name and Port_IDs
51  * must be maintained and validated before use each time a datagram
52  * needs to be sent to the destination ports. The FC transport module
53  * informs the fcip module of all changes to states of ports on the
54  * fabric through registered callbacks. This enables the fcip module
55  * to maintain the WW_PN to Port_ID mappings current.
56  *
57  * For details on how this module interfaces with the FibreChannel Transport
58  * modules, refer to PSARC/1997/385. Chapter 3 of the FibreChannel Transport
59  * Programming guide details the APIs between ULPs and the Transport.
60  *
61  * Now for some Caveats:
62  *
63  * RFC 2625 requires that a FibreChannel Port name (the Port WWN) have
64  * the NAA bits set to '0001' indicating a IEEE 48bit address which
65  * corresponds to a ULA (Universal LAN MAC address). But with FibreChannel
66  * adapters containing 2 or more ports, IEEE naming cannot identify the
67  * ports on an adapter uniquely so we will in the first implementation
68  * be operating only on Port 0 of each adapter.
69  */
70 
71 #include	<sys/types.h>
72 #include	<sys/errno.h>
73 #include	<sys/debug.h>
74 #include	<sys/time.h>
75 #include	<sys/sysmacros.h>
76 #include	<sys/systm.h>
77 #include	<sys/user.h>
78 #include	<sys/stropts.h>
79 #include	<sys/stream.h>
80 #include	<sys/strlog.h>
81 #include	<sys/strsubr.h>
82 #include	<sys/cmn_err.h>
83 #include	<sys/cpu.h>
84 #include	<sys/kmem.h>
85 #include	<sys/conf.h>
86 #include	<sys/ddi.h>
87 #include	<sys/sunddi.h>
88 #include	<sys/ksynch.h>
89 #include	<sys/stat.h>
90 #include	<sys/kstat.h>
91 #include	<sys/vtrace.h>
92 #include	<sys/strsun.h>
93 #include	<sys/varargs.h>
94 #include	<sys/modctl.h>
95 #include 	<sys/thread.h>
96 #include 	<sys/var.h>
97 #include 	<sys/proc.h>
98 #include	<inet/common.h>
99 #include	<netinet/ip6.h>
100 #include	<inet/ip.h>
101 #include	<inet/arp.h>
102 #include	<inet/mi.h>
103 #include	<inet/nd.h>
104 #include	<sys/dlpi.h>
105 #include	<sys/ethernet.h>
106 #include	<sys/file.h>
107 #include	<sys/syslog.h>
108 #include	<sys/disp.h>
109 #include	<sys/taskq.h>
110 
111 /*
112  * Leadville includes
113  */
114 
115 #include	<sys/fibre-channel/fc.h>
116 #include	<sys/fibre-channel/impl/fc_ulpif.h>
117 #include	<sys/fibre-channel/ulp/fcip.h>
118 
119 /*
120  * TNF Probe/trace facility include
121  */
122 #if defined(lint) || defined(FCIP_TNF_ENABLED)
123 #include <sys/tnf_probe.h>
124 #endif
125 
126 #define	FCIP_ESBALLOC
127 
128 /*
129  * Function prototypes
130  */
131 
132 /* standard loadable modules entry points */
133 static int	fcip_attach(dev_info_t *, ddi_attach_cmd_t);
134 static int 	fcip_detach(dev_info_t *, ddi_detach_cmd_t);
135 static void 	fcip_dodetach(struct fcipstr *slp);
136 static int fcip_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd,
137     void *arg, void **result);
138 
139 
140 /* streams specific */
141 static void fcip_setipq(struct fcip *fptr);
142 static int fcip_wput(queue_t *, mblk_t *);
143 static int fcip_wsrv(queue_t *);
144 static void fcip_proto(queue_t *, mblk_t *);
145 static void fcip_ioctl(queue_t *, mblk_t *);
146 static int fcip_open(queue_t *wq, dev_t *devp, int flag,
147 		int sflag, cred_t *credp);
148 static int fcip_close(queue_t *rq, int flag, cred_t *credp);
149 static int fcip_start(queue_t *wq, mblk_t *mp, struct fcip *fptr,
150     struct fcip_dest *fdestp, int flags);
151 static void fcip_sendup(struct fcip *fptr, mblk_t *mp,
152     struct fcipstr *(*acceptfunc)());
153 static struct fcipstr *fcip_accept(struct fcipstr *slp, struct fcip *fptr,
154     int type, la_wwn_t *dhostp);
155 static mblk_t *fcip_addudind(struct fcip *fptr, mblk_t *mp,
156     fcph_network_hdr_t *nhdr, int type);
157 static int fcip_setup_mac_addr(struct fcip *fptr);
158 static void fcip_kstat_init(struct fcip *fptr);
159 static int fcip_stat_update(kstat_t *, int);
160 
161 
162 /* dlpi specific */
163 static void fcip_spareq(queue_t *wq, mblk_t *mp);
164 static void fcip_pareq(queue_t *wq, mblk_t *mp);
165 static void fcip_ubreq(queue_t *wq, mblk_t *mp);
166 static void fcip_breq(queue_t *wq, mblk_t *mp);
167 static void fcip_dreq(queue_t *wq, mblk_t *mp);
168 static void fcip_areq(queue_t *wq, mblk_t *mp);
169 static void fcip_udreq(queue_t *wq, mblk_t *mp);
170 static void fcip_ireq(queue_t *wq, mblk_t *mp);
171 static void fcip_dl_ioc_hdr_info(queue_t *wq, mblk_t *mp);
172 
173 
174 /* solaris sundry, DR/CPR etc */
175 static int fcip_cache_constructor(void *buf, void *arg, int size);
176 static void fcip_cache_destructor(void *buf, void *size);
177 static int fcip_handle_suspend(fcip_port_info_t *fport, fc_detach_cmd_t cmd);
178 static int fcip_handle_resume(fcip_port_info_t *fport,
179     fc_ulp_port_info_t *port_info, fc_attach_cmd_t cmd);
180 static fcip_port_info_t *fcip_softstate_free(fcip_port_info_t *fport);
181 static int fcip_port_attach_handler(struct fcip *fptr);
182 
183 
184 /*
185  * ulp - transport interface function prototypes
186  */
187 static int fcip_port_attach(opaque_t ulp_handle, fc_ulp_port_info_t *,
188     fc_attach_cmd_t cmd, uint32_t sid);
189 static int fcip_port_detach(opaque_t ulp_handle, fc_ulp_port_info_t *,
190     fc_detach_cmd_t cmd);
191 static int fcip_port_ioctl(opaque_t ulp_handle,  opaque_t port_handle,
192     dev_t dev, int cmd, intptr_t data, int mode, cred_t *credp, int *rval,
193     uint32_t claimed);
194 static void fcip_statec_cb(opaque_t ulp_handle, opaque_t phandle,
195     uint32_t port_state, uint32_t port_top, fc_portmap_t changelist[],
196     uint32_t listlen, uint32_t sid);
197 static int fcip_els_cb(opaque_t ulp_handle, opaque_t phandle,
198     fc_unsol_buf_t *buf, uint32_t claimed);
199 static int fcip_data_cb(opaque_t ulp_handle, opaque_t phandle,
200     fc_unsol_buf_t *payload, uint32_t claimed);
201 
202 
203 /* Routing table specific */
204 static void fcip_handle_topology(struct fcip *fptr);
205 static int fcip_init_port(struct fcip *fptr);
206 struct fcip_routing_table *fcip_lookup_rtable(struct fcip *fptr,
207     la_wwn_t *pwwn, int matchflag);
208 static void fcip_rt_update(struct fcip *fptr, fc_portmap_t *devlist,
209     uint32_t listlen);
210 static void fcip_rt_flush(struct fcip *fptr);
211 static void fcip_rte_remove_deferred(void *arg);
212 static int fcip_do_plogi(struct fcip *fptr, struct fcip_routing_table *frp);
213 
214 
215 /* dest table specific */
216 static struct fcip_dest *fcip_get_dest(struct fcip *fptr,
217     la_wwn_t *dlphys);
218 static struct fcip_dest *fcip_add_dest(struct fcip *fptr,
219     struct fcip_routing_table *frp);
220 static int fcip_dest_add_broadcast_entry(struct fcip *fptr, int new_flag);
221 static uint32_t fcip_get_broadcast_did(struct fcip *fptr);
222 static void fcip_cleanup_dest(struct fcip *fptr);
223 
224 
225 /* helper functions */
226 static fcip_port_info_t *fcip_get_port(opaque_t phandle);
227 static int fcip_wwn_compare(la_wwn_t *wwn1, la_wwn_t *wwn2, int flag);
228 static void fcip_ether_to_str(struct ether_addr *e, caddr_t s);
229 static int fcip_port_get_num_pkts(struct fcip *fptr);
230 static int fcip_check_port_busy(struct fcip *fptr);
231 static void fcip_check_remove_minor_node(void);
232 static int fcip_set_wwn(la_wwn_t *pwwn);
233 static int fcip_plogi_in_progress(struct fcip *fptr);
234 static int fcip_check_port_exists(struct fcip *fptr);
235 static int fcip_is_supported_fc_topology(int fc_topology);
236 
237 
238 /* pkt specific */
239 static fcip_pkt_t *fcip_pkt_alloc(struct fcip *fptr, mblk_t *bp,
240     int flags, int datalen);
241 static void fcip_pkt_free(struct fcip_pkt *fcip_pkt, int flags);
242 static fcip_pkt_t *fcip_ipkt_alloc(struct fcip *fptr, int cmdlen,
243     int resplen, opaque_t pd, int flags);
244 static void fcip_ipkt_free(fcip_pkt_t *fcip_pkt);
245 static void fcip_ipkt_callback(fc_packet_t *fc_pkt);
246 static void fcip_free_pkt_dma(fcip_pkt_t *fcip_pkt);
247 static void fcip_pkt_callback(fc_packet_t *fc_pkt);
248 static void fcip_init_unicast_pkt(fcip_pkt_t *fcip_pkt, fc_portid_t sid,
249     fc_portid_t did, void (*comp) ());
250 static int fcip_transport(fcip_pkt_t *fcip_pkt);
251 static void fcip_pkt_timeout(void *arg);
252 static void fcip_timeout(void *arg);
253 static void fcip_fdestp_enqueue_pkt(struct fcip_dest *fdestp,
254     fcip_pkt_t *fcip_pkt);
255 static int fcip_fdestp_dequeue_pkt(struct fcip_dest *fdestp,
256     fcip_pkt_t *fcip_pkt);
257 static int fcip_sendup_constructor(void *buf, void *arg, int flags);
258 static void fcip_sendup_thr(void *arg);
259 static int fcip_sendup_alloc_enque(struct fcip *ftpr, mblk_t *mp,
260     struct fcipstr *(*f)());
261 
262 /*
263  * zero copy inbound data handling
264  */
265 #ifdef FCIP_ESBALLOC
266 static void fcip_ubfree(char *arg);
267 #endif /* FCIP_ESBALLOC */
268 
269 #if !defined(FCIP_ESBALLOC)
270 static void *fcip_allocb(size_t size, uint_t pri);
271 #endif
272 
273 
274 /* FCIP FARP support functions */
275 static struct fcip_dest *fcip_do_farp(struct fcip *fptr, la_wwn_t *pwwn,
276     char *ip_addr, size_t ip_addr_len, int flags);
277 static void fcip_init_broadcast_pkt(fcip_pkt_t *fcip_pkt, void (*comp) (),
278     int is_els);
279 static int fcip_handle_farp_request(struct fcip *fptr, la_els_farp_t *fcmd);
280 static int fcip_handle_farp_response(struct fcip *fptr, la_els_farp_t *fcmd);
281 static void fcip_cache_arp_broadcast(struct fcip *ftpr, fc_unsol_buf_t *buf);
282 static void fcip_port_ns(void *arg);
283 
284 #ifdef DEBUG
285 
286 #include <sys/debug.h>
287 
288 #define	FCIP_DEBUG_DEFAULT	0x1
289 #define	FCIP_DEBUG_ATTACH	0x2
290 #define	FCIP_DEBUG_INIT		0x4
291 #define	FCIP_DEBUG_DETACH	0x8
292 #define	FCIP_DEBUG_DLPI		0x10
293 #define	FCIP_DEBUG_ELS		0x20
294 #define	FCIP_DEBUG_DOWNSTREAM	0x40
295 #define	FCIP_DEBUG_UPSTREAM	0x80
296 #define	FCIP_DEBUG_MISC		0x100
297 
298 #define	FCIP_DEBUG_STARTUP	(FCIP_DEBUG_ATTACH|FCIP_DEBUG_INIT)
299 #define	FCIP_DEBUG_DATAOUT	(FCIP_DEBUG_DLPI|FCIP_DEBUG_DOWNSTREAM)
300 #define	FCIP_DEBUG_DATAIN	(FCIP_DEBUG_ELS|FCIP_DEBUG_UPSTREAM)
301 
302 static int fcip_debug = FCIP_DEBUG_DEFAULT;
303 
304 #define	FCIP_DEBUG(level, args)	\
305 	if (fcip_debug & (level))	cmn_err args;
306 
307 #else	/* DEBUG */
308 
309 #define	FCIP_DEBUG(level, args)		/* do nothing */
310 
311 #endif	/* DEBUG */
312 
313 #define	KIOIP	KSTAT_INTR_PTR(fcip->fcip_intrstats)
314 
315 /*
316  * Endian independent ethernet to WWN copy
317  */
318 #define	ether_to_wwn(E, W)	\
319 	bzero((void *)(W), sizeof (la_wwn_t)); \
320 	bcopy((void *)(E), (void *)&((W)->raw_wwn[2]), ETHERADDRL); \
321 	(W)->raw_wwn[0] |= 0x10
322 
323 /*
324  * wwn_to_ether : Endian independent, copies a WWN to struct ether_addr.
325  * The args to the macro are pointers to WWN and ether_addr structures
326  */
327 #define	wwn_to_ether(W, E)	\
328 	bcopy((void *)&((W)->raw_wwn[2]), (void *)E, ETHERADDRL)
329 
330 /*
331  * The module_info structure contains identification and limit values.
332  * All queues associated with a certain driver share the same module_info
333  * structures. This structure defines the characteristics of that driver/
334  * module's queues. The module name must be unique. The max and min packet
335  * sizes limit the no. of characters in M_DATA messages. The Hi and Lo
336  * water marks are for flow control when a module has a service procedure.
337  */
338 static struct module_info	fcipminfo = {
339 	FCIPIDNUM,	/* mi_idnum : Module ID num */
340 	FCIPNAME, 	/* mi_idname: Module Name */
341 	FCIPMINPSZ,	/* mi_minpsz: Min packet size */
342 	FCIPMAXPSZ,	/* mi_maxpsz: Max packet size */
343 	FCIPHIWAT,	/* mi_hiwat : High water mark */
344 	FCIPLOWAT	/* mi_lowat : Low water mark */
345 };
346 
347 /*
348  * The qinit structres contain the module put, service. open and close
349  * procedure pointers. All modules and drivers with the same streamtab
350  * file (i.e same fmodsw or cdevsw entry points) point to the same
351  * upstream (read) and downstream (write) qinit structs.
352  */
353 static struct qinit	fcip_rinit = {
354 	NULL,		/* qi_putp */
355 	NULL,		/* qi_srvp */
356 	fcip_open,	/* qi_qopen */
357 	fcip_close,	/* qi_qclose */
358 	NULL,		/* qi_qadmin */
359 	&fcipminfo,	/* qi_minfo */
360 	NULL		/* qi_mstat */
361 };
362 
363 static struct qinit	fcip_winit = {
364 	fcip_wput,	/* qi_putp */
365 	fcip_wsrv,	/* qi_srvp */
366 	NULL,		/* qi_qopen */
367 	NULL,		/* qi_qclose */
368 	NULL,		/* qi_qadmin */
369 	&fcipminfo,	/* qi_minfo */
370 	NULL		/* qi_mstat */
371 };
372 
373 /*
374  * streamtab contains pointers to the read and write qinit structures
375  */
376 
377 static struct streamtab fcip_info = {
378 	&fcip_rinit,	/* st_rdinit */
379 	&fcip_winit,	/* st_wrinit */
380 	NULL,		/* st_muxrinit */
381 	NULL,		/* st_muxwrinit */
382 };
383 
384 static struct cb_ops  fcip_cb_ops = {
385 	nodev,				/* open */
386 	nodev,				/* close */
387 	nodev,				/* strategy */
388 	nodev,				/* print */
389 	nodev,				/* dump */
390 	nodev,				/* read */
391 	nodev,				/* write */
392 	nodev,				/* ioctl */
393 	nodev,				/* devmap */
394 	nodev,				/* mmap */
395 	nodev,				/* segmap */
396 	nochpoll,			/* poll */
397 	ddi_prop_op,			/* cb_prop_op */
398 	&fcip_info,			/* streamtab  */
399 	D_MP | D_HOTPLUG,		/* Driver compatibility flag */
400 	CB_REV,				/* rev */
401 	nodev,				/* int (*cb_aread)() */
402 	nodev				/* int (*cb_awrite)() */
403 };
404 
405 /*
406  * autoconfiguration routines.
407  */
408 static struct dev_ops fcip_ops = {
409 	DEVO_REV,		/* devo_rev, */
410 	0,			/* refcnt  */
411 	fcip_getinfo,		/* info */
412 	nulldev,		/* identify */
413 	nulldev,		/* probe */
414 	fcip_attach,		/* attach */
415 	fcip_detach,		/* detach */
416 	nodev,			/* RESET */
417 	&fcip_cb_ops,		/* driver operations */
418 	NULL,			/* bus operations */
419 	ddi_power		/* power management */
420 };
421 
422 #define	FCIP_VERSION	"1.61"
423 #define	FCIP_NAME	"SunFC FCIP v" FCIP_VERSION
424 
425 #define	PORT_DRIVER	"fp"
426 
427 #define	GETSTRUCT(struct, number)	\
428 	((struct *)kmem_zalloc((size_t)(sizeof (struct) * (number)), \
429 		KM_SLEEP))
430 
431 static struct modldrv modldrv = {
432 	&mod_driverops,			/* Type of module - driver */
433 	FCIP_NAME,			/* Name of module */
434 	&fcip_ops,			/* driver ops */
435 };
436 
437 static struct modlinkage modlinkage = {
438 	MODREV_1, (void *)&modldrv, NULL
439 };
440 
441 
442 /*
443  * Now for some global statics
444  */
445 static uint32_t	fcip_ub_nbufs = FCIP_UB_NBUFS;
446 static uint32_t fcip_ub_size = FCIP_UB_SIZE;
447 static int fcip_pkt_ttl_ticks = FCIP_PKT_TTL;
448 static int fcip_tick_incr = 1;
449 static int fcip_wait_cmds = FCIP_WAIT_CMDS;
450 static int fcip_num_attaching = 0;
451 static int fcip_port_attach_pending = 0;
452 static int fcip_create_nodes_on_demand = 1;	/* keep it similar to fcp */
453 static int fcip_cache_on_arp_broadcast = 0;
454 static int fcip_farp_supported = 0;
455 static int fcip_minor_node_created = 0;
456 
457 /*
458  * Supported FCAs
459  */
460 #define	QLC_PORT_1_ID_BITS		0x100
461 #define	QLC_PORT_2_ID_BITS		0x101
462 #define	QLC_PORT_NAA			0x2
463 #define	QLC_MODULE_NAME			"qlc"
464 #define	IS_QLC_PORT(port_dip)		\
465 			(strcmp(ddi_driver_name(ddi_get_parent((port_dip))),\
466 			QLC_MODULE_NAME) == 0)
467 
468 
469 /*
470  * fcip softstate structures head.
471  */
472 
473 static void *fcip_softp = NULL;
474 
475 /*
476  * linked list of active (inuse) driver streams
477  */
478 
479 static int fcip_num_instances = 0;
480 static dev_info_t *fcip_module_dip = (dev_info_t *)0;
481 
482 
483 /*
484  * Ethernet broadcast address: Broadcast addressing in IP over fibre
485  * channel should be the IEEE ULA (also the low 6 bytes of the Port WWN).
486  *
487  * The broadcast addressing varies for differing topologies a node may be in:
488  *	- On a private loop the ARP broadcast is a class 3 sequence sent
489  *	  using OPNfr (Open Broadcast Replicate primitive) followed by
490  *	  the ARP frame to D_ID 0xFFFFFF
491  *
492  *	- On a public Loop the broadcast sequence is sent to AL_PA 0x00
493  *	  (no OPNfr primitive).
494  *
495  *	- For direct attach and point to point topologies we just send
496  *	  the frame to D_ID 0xFFFFFF
497  *
498  * For public loop the handling would probably be different - for now
499  * I'll just declare this struct - It can be deleted if not necessary.
500  *
501  */
502 
503 
504 /*
505  * DL_INFO_ACK template for the fcip module. The dl_info_ack_t structure is
506  * returned as a part of an  DL_INFO_ACK message which is a M_PCPROTO message
507  * returned in response to a DL_INFO_REQ message sent to us from a DLS user
508  * Let us fake an ether header as much as possible.
509  *
510  * dl_addr_length is the Provider's DLSAP addr which is SAP addr +
511  *                Physical addr of the provider. We set this to
512  *                ushort_t + sizeof (la_wwn_t) for Fibre Channel ports.
513  * dl_mac_type    Lets just use DL_ETHER - we can try using DL_IPFC, a new
514  *		  dlpi.h define later.
515  * dl_sap_length  -2 indicating the SAP address follows the Physical addr
516  *		  component in the DLSAP addr.
517  * dl_service_mode: DLCLDS - connectionless data link service.
518  *
519  */
520 
521 static dl_info_ack_t fcip_infoack = {
522 	DL_INFO_ACK,				/* dl_primitive */
523 	FCIPMTU,				/* dl_max_sdu */
524 	0,					/* dl_min_sdu */
525 	FCIPADDRL,				/* dl_addr_length */
526 	DL_ETHER,				/* dl_mac_type */
527 	0,					/* dl_reserved */
528 	0,					/* dl_current_state */
529 	-2,					/* dl_sap_length */
530 	DL_CLDLS,				/* dl_service_mode */
531 	0,					/* dl_qos_length */
532 	0,					/* dl_qos_offset */
533 	0,					/* dl_range_length */
534 	0,					/* dl_range_offset */
535 	DL_STYLE2,				/* dl_provider_style */
536 	sizeof (dl_info_ack_t),			/* dl_addr_offset */
537 	DL_VERSION_2,				/* dl_version */
538 	ETHERADDRL,				/* dl_brdcst_addr_length */
539 	sizeof (dl_info_ack_t) + FCIPADDRL,	/* dl_brdcst_addr_offset */
540 	0					/* dl_growth */
541 };
542 
543 /*
544  * FCIP broadcast address definition.
545  */
546 static	struct ether_addr	fcipnhbroadcastaddr = {
547 	0xff, 0xff, 0xff, 0xff, 0xff, 0xff
548 };
549 
550 /*
551  * RFC2625 requires the broadcast ARP address in the ARP data payload to
552  * be set to 0x00 00 00 00 00 00 for ARP broadcast packets
553  */
554 static	struct ether_addr	fcip_arpbroadcast_addr = {
555 	0x00, 0x00, 0x00, 0x00, 0x00, 0x00
556 };
557 
558 
559 #define	ether_bcopy(src, dest)	bcopy((src), (dest), ETHERADDRL);
560 
561 /*
562  * global kernel locks
563  */
564 static kcondvar_t	fcip_global_cv;
565 static kmutex_t		fcip_global_mutex;
566 
567 /*
568  * fctl external defines
569  */
570 extern int fc_ulp_add(fc_ulp_modinfo_t *);
571 
572 /*
573  * fctl data structures
574  */
575 
576 #define	FCIP_REV	0x07
577 
578 /* linked list of port info structures */
579 static fcip_port_info_t *fcip_port_head = NULL;
580 
581 /* linked list of fcip structures */
582 static struct fcipstr	*fcipstrup = NULL;
583 static krwlock_t	fcipstruplock;
584 
585 
586 /*
587  * Module information structure. This structure gives the FC Transport modules
588  * information about an ULP that registers with it.
589  */
590 static fc_ulp_modinfo_t	fcip_modinfo = {
591 	0,			/* for xref checks? */
592 	FCTL_ULP_MODREV_4,	/* FCIP revision */
593 	FC_TYPE_IS8802_SNAP,	/* type 5 for SNAP encapsulated datagrams */
594 	FCIP_NAME,		/* module name as in the modldrv struct */
595 	0x0,			/* get all statec callbacks for now */
596 	fcip_port_attach,	/* port attach callback */
597 	fcip_port_detach,	/* port detach callback */
598 	fcip_port_ioctl,	/* port ioctl callback */
599 	fcip_els_cb,		/* els callback */
600 	fcip_data_cb,		/* data callback */
601 	fcip_statec_cb		/* state change callback */
602 };
603 
604 
605 /*
606  * Solaris 9 and up, the /kernel/drv/fp.conf file will have the following entry
607  *
608  * ddi-forceattach=1;
609  *
610  * This will ensure that fp is loaded at bootup. No additional checks are needed
611  */
612 int
613 _init(void)
614 {
615 	int	rval;
616 
617 	FCIP_TNF_LOAD();
618 
619 	/*
620 	 * Initialize the mutexs used by port attach and other callbacks.
621 	 * The transport can call back into our port_attach_callback
622 	 * routine even before _init() completes and bad things can happen.
623 	 */
624 	mutex_init(&fcip_global_mutex, NULL, MUTEX_DRIVER, NULL);
625 	cv_init(&fcip_global_cv, NULL, CV_DRIVER, NULL);
626 	rw_init(&fcipstruplock, NULL, RW_DRIVER, NULL);
627 
628 	mutex_enter(&fcip_global_mutex);
629 	fcip_port_attach_pending = 1;
630 	mutex_exit(&fcip_global_mutex);
631 
632 	/*
633 	 * Now attempt to register fcip with the transport.
634 	 * If fc_ulp_add fails, fcip module will not be loaded.
635 	 */
636 	rval = fc_ulp_add(&fcip_modinfo);
637 	if (rval != FC_SUCCESS) {
638 		mutex_destroy(&fcip_global_mutex);
639 		cv_destroy(&fcip_global_cv);
640 		rw_destroy(&fcipstruplock);
641 		switch (rval) {
642 		case FC_ULP_SAMEMODULE:
643 			FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
644 			    "!fcip: module is already registered with"
645 			    " transport"));
646 			rval = EEXIST;
647 			break;
648 		case FC_ULP_SAMETYPE:
649 			FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
650 			    "!fcip: Another module of the same ULP type 0x%x"
651 			    " is already registered with the transport",
652 			    fcip_modinfo.ulp_type));
653 			rval = EEXIST;
654 			break;
655 		case FC_BADULP:
656 			FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
657 			    "!fcip: Current fcip version 0x%x does not match"
658 			    " fctl version",
659 			    fcip_modinfo.ulp_rev));
660 			rval = ENODEV;
661 			break;
662 		default:
663 			FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
664 			    "!fcip: fc_ulp_add failed with status 0x%x", rval));
665 			rval = ENODEV;
666 			break;
667 		}
668 		FCIP_TNF_UNLOAD(&modlinkage);
669 		return (rval);
670 	}
671 
672 	if ((rval = ddi_soft_state_init(&fcip_softp, sizeof (struct fcip),
673 			FCIP_NUM_INSTANCES)) != 0) {
674 		mutex_destroy(&fcip_global_mutex);
675 		cv_destroy(&fcip_global_cv);
676 		rw_destroy(&fcipstruplock);
677 		(void) fc_ulp_remove(&fcip_modinfo);
678 		FCIP_TNF_UNLOAD(&modlinkage);
679 		return (rval);
680 	}
681 
682 	if ((rval = mod_install(&modlinkage)) != 0) {
683 		FCIP_TNF_UNLOAD(&modlinkage);
684 		(void) fc_ulp_remove(&fcip_modinfo);
685 		mutex_destroy(&fcip_global_mutex);
686 		cv_destroy(&fcip_global_cv);
687 		rw_destroy(&fcipstruplock);
688 		ddi_soft_state_fini(&fcip_softp);
689 	}
690 	return (rval);
691 }
692 
693 /*
694  * Unload the port driver if this was the only ULP loaded and then
695  * deregister with the transport.
696  */
697 int
698 _fini(void)
699 {
700 	int	rval;
701 	int	rval1;
702 
703 	/*
704 	 * Do not permit the module to be unloaded before a port
705 	 * attach callback has happened.
706 	 */
707 	mutex_enter(&fcip_global_mutex);
708 	if (fcip_num_attaching || fcip_port_attach_pending) {
709 		mutex_exit(&fcip_global_mutex);
710 		return (EBUSY);
711 	}
712 	mutex_exit(&fcip_global_mutex);
713 
714 	if ((rval = mod_remove(&modlinkage)) != 0) {
715 		return (rval);
716 	}
717 
718 	/*
719 	 * unregister with the transport layer
720 	 */
721 	rval1 = fc_ulp_remove(&fcip_modinfo);
722 
723 	/*
724 	 * If the ULP was not registered with the transport, init should
725 	 * have failed. If transport has no knowledge of our existence
726 	 * we should simply bail out and succeed
727 	 */
728 #ifdef DEBUG
729 	if (rval1 == FC_BADULP) {
730 		FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
731 		"fcip: ULP was never registered with the transport"));
732 		rval = ENODEV;
733 	} else if (rval1 == FC_BADTYPE) {
734 		FCIP_DEBUG(FCIP_DEBUG_DEFAULT, (CE_WARN,
735 			"fcip: No ULP of this type 0x%x was registered with "
736 			"transport", fcip_modinfo.ulp_type));
737 		rval = ENODEV;
738 	}
739 #endif /* DEBUG */
740 
741 	mutex_destroy(&fcip_global_mutex);
742 	rw_destroy(&fcipstruplock);
743 	cv_destroy(&fcip_global_cv);
744 	ddi_soft_state_fini(&fcip_softp);
745 
746 	FCIP_TNF_UNLOAD(&modlinkage);
747 
748 	return (rval);
749 }
750 
751 /*
752  * Info about this loadable module
753  */
754 int
755 _info(struct modinfo *modinfop)
756 {
757 	return (mod_info(&modlinkage, modinfop));
758 }
759 
760 /*
761  * The port attach callback is invoked by the port driver when a FCA
762  * port comes online and binds with the transport layer. The transport
763  * then callsback into all ULP modules registered with it. The Port attach
764  * call back will also provide the ULP module with the Port's WWN and S_ID
765  */
766 /* ARGSUSED */
767 static int
768 fcip_port_attach(opaque_t ulp_handle, fc_ulp_port_info_t *port_info,
769     fc_attach_cmd_t cmd, uint32_t sid)
770 {
771 	int 			rval = FC_FAILURE;
772 	int 			instance;
773 	struct fcip		*fptr;
774 	fcip_port_info_t	*fport = NULL;
775 	fcip_port_info_t	*cur_fport;
776 	fc_portid_t		src_id;
777 
778 	switch (cmd) {
779 	case FC_CMD_ATTACH: {
780 		la_wwn_t	*ww_pn = NULL;
781 		/*
782 		 * It was determined that, as per spec, the lower 48 bits of
783 		 * the port-WWN will always be unique. This will make the MAC
784 		 * address (i.e the lower 48 bits of the WWN), that IP/ARP
785 		 * depend on, unique too. Hence we should be able to remove the
786 		 * restriction of attaching to only one of the ports of
787 		 * multi port FCAs.
788 		 *
789 		 * Earlier, fcip used to attach only to qlc module and fail
790 		 * silently for attach failures resulting from unknown FCAs or
791 		 * unsupported FCA ports. Now, we'll do no such checks.
792 		 */
793 		ww_pn = &port_info->port_pwwn;
794 
795 		FCIP_TNF_PROBE_2((fcip_port_attach, "fcip io", /* CSTYLED */,
796 			tnf_string, msg, "port id bits",
797 			tnf_opaque, nport_id, ww_pn->w.nport_id));
798 		FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_NOTE,
799 		    "port id bits: 0x%x", ww_pn->w.nport_id));
800 		/*
801 		 * A port has come online
802 		 */
803 		mutex_enter(&fcip_global_mutex);
804 		fcip_num_instances++;
805 		fcip_num_attaching++;
806 
807 		if (fcip_port_head == NULL) {
808 			/* OK to sleep here ? */
809 			fport = kmem_zalloc(sizeof (fcip_port_info_t),
810 						KM_NOSLEEP);
811 			if (fport == NULL) {
812 				fcip_num_instances--;
813 				fcip_num_attaching--;
814 				ASSERT(fcip_num_attaching >= 0);
815 				mutex_exit(&fcip_global_mutex);
816 				rval = FC_FAILURE;
817 				cmn_err(CE_WARN, "!fcip(%d): port attach "
818 				    "failed: alloc failed",
819 				    ddi_get_instance(port_info->port_dip));
820 				goto done;
821 			}
822 			fcip_port_head = fport;
823 		} else {
824 			/*
825 			 * traverse the port list and also check for
826 			 * duplicate port attaches - Nothing wrong in being
827 			 * paranoid Heh Heh.
828 			 */
829 			cur_fport = fcip_port_head;
830 			while (cur_fport != NULL) {
831 				if (cur_fport->fcipp_handle ==
832 				    port_info->port_handle) {
833 					fcip_num_instances--;
834 					fcip_num_attaching--;
835 					ASSERT(fcip_num_attaching >= 0);
836 					mutex_exit(&fcip_global_mutex);
837 					FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_WARN,
838 					    "!fcip(%d): port already "
839 					    "attached!!", ddi_get_instance(
840 					    port_info->port_dip)));
841 					rval = FC_FAILURE;
842 					goto done;
843 				}
844 				cur_fport = cur_fport->fcipp_next;
845 			}
846 			fport = kmem_zalloc(sizeof (fcip_port_info_t),
847 						KM_NOSLEEP);
848 			if (fport == NULL) {
849 				rval = FC_FAILURE;
850 				fcip_num_instances--;
851 				fcip_num_attaching--;
852 				ASSERT(fcip_num_attaching >= 0);
853 				mutex_exit(&fcip_global_mutex);
854 				cmn_err(CE_WARN, "!fcip(%d): port attach "
855 				    "failed: alloc failed",
856 				    ddi_get_instance(port_info->port_dip));
857 				goto done;
858 			}
859 			fport->fcipp_next = fcip_port_head;
860 			fcip_port_head = fport;
861 		}
862 
863 		mutex_exit(&fcip_global_mutex);
864 
865 		/*
866 		 * now fill in the details about the port itself
867 		 */
868 		fport->fcipp_linkage = *port_info->port_linkage;
869 		fport->fcipp_handle = port_info->port_handle;
870 		fport->fcipp_dip = port_info->port_dip;
871 		fport->fcipp_topology = port_info->port_flags;
872 		fport->fcipp_pstate = port_info->port_state;
873 		fport->fcipp_naa = port_info->port_pwwn.w.naa_id;
874 		bcopy(&port_info->port_pwwn, &fport->fcipp_pwwn,
875 		    sizeof (la_wwn_t));
876 		bcopy(&port_info->port_nwwn, &fport->fcipp_nwwn,
877 		    sizeof (la_wwn_t));
878 		fport->fcipp_fca_pkt_size = port_info->port_fca_pkt_size;
879 		fport->fcipp_cmd_dma_attr = *port_info->port_cmd_dma_attr;
880 		fport->fcipp_resp_dma_attr = *port_info->port_resp_dma_attr;
881 		fport->fcipp_fca_acc_attr = *port_info->port_acc_attr;
882 		src_id.port_id = sid;
883 		src_id.priv_lilp_posit = 0;
884 		fport->fcipp_sid = src_id;
885 
886 		/*
887 		 * allocate soft state for this instance
888 		 */
889 		instance = ddi_get_instance(fport->fcipp_dip);
890 		if (ddi_soft_state_zalloc(fcip_softp,
891 		    instance) != DDI_SUCCESS) {
892 			rval = FC_FAILURE;
893 			cmn_err(CE_WARN, "!fcip(%d): port attach failed: "
894 			    "soft state alloc failed", instance);
895 			goto failure;
896 		}
897 
898 		fptr = ddi_get_soft_state(fcip_softp, instance);
899 
900 		if (fptr == NULL) {
901 			rval = FC_FAILURE;
902 			cmn_err(CE_WARN, "!fcip(%d): port attach failed: "
903 			    "failure to get soft state", instance);
904 			goto failure;
905 		}
906 
907 		/*
908 		 * initialize all mutexes and locks required for this module
909 		 */
910 		mutex_init(&fptr->fcip_mutex, NULL, MUTEX_DRIVER, NULL);
911 		mutex_init(&fptr->fcip_ub_mutex, NULL, MUTEX_DRIVER, NULL);
912 		mutex_init(&fptr->fcip_rt_mutex, NULL, MUTEX_DRIVER, NULL);
913 		mutex_init(&fptr->fcip_dest_mutex, NULL, MUTEX_DRIVER, NULL);
914 		mutex_init(&fptr->fcip_sendup_mutex, NULL, MUTEX_DRIVER, NULL);
915 		cv_init(&fptr->fcip_farp_cv, NULL, CV_DRIVER, NULL);
916 		cv_init(&fptr->fcip_sendup_cv, NULL, CV_DRIVER, NULL);
917 		cv_init(&fptr->fcip_ub_cv, NULL, CV_DRIVER, NULL);
918 
919 		mutex_enter(&fptr->fcip_mutex);
920 
921 		fptr->fcip_dip = fport->fcipp_dip;	/* parent's dip */
922 		fptr->fcip_instance = instance;
923 		fptr->fcip_ub_upstream = 0;
924 
925 		if (FC_PORT_STATE_MASK(port_info->port_state) ==
926 		    FC_STATE_ONLINE) {
927 			fptr->fcip_port_state = FCIP_PORT_ONLINE;
928 			if (fptr->fcip_flags & FCIP_LINK_DOWN) {
929 				fptr->fcip_flags &= ~FCIP_LINK_DOWN;
930 			}
931 		} else {
932 			fptr->fcip_port_state = FCIP_PORT_OFFLINE;
933 		}
934 
935 		fptr->fcip_flags |= FCIP_ATTACHING;
936 		fptr->fcip_port_info = fport;
937 
938 		/*
939 		 * Extract our MAC addr from our port's WWN. The lower 48
940 		 * bits will be our MAC address
941 		 */
942 		wwn_to_ether(&fport->fcipp_nwwn, &fptr->fcip_macaddr);
943 
944 		fport->fcipp_fcip = fptr;
945 
946 		FCIP_DEBUG(FCIP_DEBUG_ATTACH,
947 		    (CE_NOTE, "fcipdest : 0x%lx, rtable : 0x%lx",
948 		    (long)(sizeof (fptr->fcip_dest)),
949 		    (long)(sizeof (fptr->fcip_rtable))));
950 
951 		bzero(fptr->fcip_dest, sizeof (fptr->fcip_dest));
952 		bzero(fptr->fcip_rtable, sizeof (fptr->fcip_rtable));
953 
954 		/*
955 		 * create a taskq to handle sundry jobs for the driver
956 		 * This way we can have jobs run in parallel
957 		 */
958 		fptr->fcip_tq = taskq_create("fcip_tasks",
959 		    FCIP_NUM_THREADS, MINCLSYSPRI, FCIP_MIN_TASKS,
960 		    FCIP_MAX_TASKS, TASKQ_PREPOPULATE);
961 
962 		mutex_exit(&fptr->fcip_mutex);
963 
964 		/*
965 		 * create a separate thread to handle all unsolicited
966 		 * callback handling. This is because unsolicited_callback
967 		 * can happen from an interrupt context and the upstream
968 		 * modules can put new messages right back in the same
969 		 * thread context. This usually works fine, but sometimes
970 		 * we may have to block to obtain the dest struct entries
971 		 * for some remote ports.
972 		 */
973 		mutex_enter(&fptr->fcip_sendup_mutex);
974 		if (thread_create(NULL, DEFAULTSTKSZ,
975 		    (void (*)())fcip_sendup_thr, (caddr_t)fptr, 0, &p0,
976 		    TS_RUN, minclsyspri) == NULL) {
977 			mutex_exit(&fptr->fcip_sendup_mutex);
978 			cmn_err(CE_WARN,
979 			    "!unable to create fcip sendup thread for "
980 			    " instance: 0x%x", instance);
981 			rval = FC_FAILURE;
982 			goto done;
983 		}
984 		fptr->fcip_sendup_thr_initted = 1;
985 		fptr->fcip_sendup_head = fptr->fcip_sendup_tail = NULL;
986 		mutex_exit(&fptr->fcip_sendup_mutex);
987 
988 
989 		/* Let the attach handler do the rest */
990 		if (fcip_port_attach_handler(fptr) != FC_SUCCESS) {
991 			/*
992 			 * We have already cleaned up so return
993 			 */
994 			rval = FC_FAILURE;
995 			cmn_err(CE_WARN, "!fcip(%d): port attach failed",
996 			    instance);
997 			goto done;
998 		}
999 
1000 		FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_CONT,
1001 		    "!fcip attach for port instance (0x%x) successful",
1002 		    instance));
1003 
1004 		rval = FC_SUCCESS;
1005 		goto done;
1006 	}
1007 	case FC_CMD_POWER_UP:
1008 	/* FALLTHROUGH */
1009 	case FC_CMD_RESUME:
1010 		mutex_enter(&fcip_global_mutex);
1011 		fport = fcip_port_head;
1012 		while (fport != NULL) {
1013 			if (fport->fcipp_handle == port_info->port_handle) {
1014 				break;
1015 			}
1016 			fport = fport->fcipp_next;
1017 		}
1018 		if (fport == NULL) {
1019 			rval = FC_SUCCESS;
1020 			mutex_exit(&fcip_global_mutex);
1021 			goto done;
1022 		}
1023 		rval = fcip_handle_resume(fport, port_info, cmd);
1024 		mutex_exit(&fcip_global_mutex);
1025 		goto done;
1026 
1027 	default:
1028 		FCIP_TNF_PROBE_2((fcip_port_attach, "fcip io", /* CSTYLED */,
1029 			tnf_string, msg, "unknown command type",
1030 			tnf_uint, cmd, cmd));
1031 		FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_WARN,
1032 		    "unknown cmd type 0x%x in port_attach", cmd));
1033 		rval = FC_FAILURE;
1034 		goto done;
1035 	}
1036 
1037 failure:
1038 	if (fport) {
1039 		mutex_enter(&fcip_global_mutex);
1040 		fcip_num_attaching--;
1041 		ASSERT(fcip_num_attaching >= 0);
1042 		(void) fcip_softstate_free(fport);
1043 		fcip_port_attach_pending = 0;
1044 		mutex_exit(&fcip_global_mutex);
1045 	}
1046 	return (rval);
1047 
1048 done:
1049 	mutex_enter(&fcip_global_mutex);
1050 	fcip_port_attach_pending = 0;
1051 	mutex_exit(&fcip_global_mutex);
1052 	return (rval);
1053 }
1054 
1055 /*
1056  * fcip_port_attach_handler : Completes the port attach operation after
1057  * the ulp_port_attach routine has completed its ground work. The job
1058  * of this function among other things is to obtain and handle topology
1059  * specifics, initialize a port, setup broadcast address entries in
1060  * the fcip tables etc. This routine cleans up behind itself on failures.
1061  * Returns FC_SUCCESS or FC_FAILURE.
1062  */
1063 static int
1064 fcip_port_attach_handler(struct fcip *fptr)
1065 {
1066 	fcip_port_info_t		*fport = fptr->fcip_port_info;
1067 	int				rval = FC_FAILURE;
1068 
1069 	ASSERT(fport != NULL);
1070 
1071 	mutex_enter(&fcip_global_mutex);
1072 
1073 	FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_NOTE,
1074 	    "fcip module dip: %p instance: %d",
1075 	    (void *)fcip_module_dip, ddi_get_instance(fptr->fcip_dip)));
1076 
1077 	if (fcip_module_dip == NULL) {
1078 		clock_t		fcip_lbolt;
1079 
1080 		fcip_lbolt = ddi_get_lbolt();
1081 		/*
1082 		 * we need to use the fcip devinfo for creating
1083 		 * the clone device node, but the fcip attach
1084 		 * (from its conf file entry claiming to be a
1085 		 * child of pseudo) may not have happened yet.
1086 		 * wait here for 10 seconds and fail port attach
1087 		 * if the fcip devinfo is not attached yet
1088 		 */
1089 		fcip_lbolt += drv_usectohz(FCIP_INIT_DELAY);
1090 
1091 		FCIP_DEBUG(FCIP_DEBUG_ATTACH,
1092 		    (CE_WARN, "cv_timedwait lbolt %lx", fcip_lbolt));
1093 
1094 		(void) cv_timedwait(&fcip_global_cv, &fcip_global_mutex,
1095 		    fcip_lbolt);
1096 
1097 		if (fcip_module_dip == NULL) {
1098 			mutex_exit(&fcip_global_mutex);
1099 
1100 			FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_WARN,
1101 				"fcip attach did not happen"));
1102 			goto port_attach_cleanup;
1103 		}
1104 	}
1105 
1106 	if ((!fcip_minor_node_created) &&
1107 	    fcip_is_supported_fc_topology(fport->fcipp_topology)) {
1108 		/*
1109 		 * Checking for same topologies which are considered valid
1110 		 * by fcip_handle_topology(). Dont create a minor node if
1111 		 * nothing is hanging off the FC port.
1112 		 */
1113 		if (ddi_create_minor_node(fcip_module_dip, "fcip", S_IFCHR,
1114 		    ddi_get_instance(fptr->fcip_dip), DDI_PSEUDO,
1115 		    CLONE_DEV) == DDI_FAILURE) {
1116 			mutex_exit(&fcip_global_mutex);
1117 			FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_WARN,
1118 			    "failed to create minor node for fcip(%d)",
1119 			    ddi_get_instance(fptr->fcip_dip)));
1120 			goto port_attach_cleanup;
1121 		}
1122 		fcip_minor_node_created++;
1123 	}
1124 	mutex_exit(&fcip_global_mutex);
1125 
1126 	/*
1127 	 * initialize port for traffic
1128 	 */
1129 	if (fcip_init_port(fptr) != FC_SUCCESS) {
1130 		/* fcip_init_port has already cleaned up its stuff */
1131 
1132 		mutex_enter(&fcip_global_mutex);
1133 
1134 		if ((fcip_num_instances == 1) &&
1135 		    (fcip_minor_node_created == 1)) {
1136 			/* Remove minor node iff this is the last instance */
1137 			ddi_remove_minor_node(fcip_module_dip, NULL);
1138 		}
1139 
1140 		mutex_exit(&fcip_global_mutex);
1141 
1142 		goto port_attach_cleanup;
1143 	}
1144 
1145 	mutex_enter(&fptr->fcip_mutex);
1146 	fptr->fcip_flags &= ~FCIP_ATTACHING;
1147 	fptr->fcip_flags |= FCIP_INITED;
1148 	fptr->fcip_timeout_ticks = 0;
1149 
1150 	/*
1151 	 * start the timeout threads
1152 	 */
1153 	fptr->fcip_timeout_id = timeout(fcip_timeout, fptr,
1154 	    drv_usectohz(1000000));
1155 
1156 	mutex_exit(&fptr->fcip_mutex);
1157 	mutex_enter(&fcip_global_mutex);
1158 	fcip_num_attaching--;
1159 	ASSERT(fcip_num_attaching >= 0);
1160 	mutex_exit(&fcip_global_mutex);
1161 	rval = FC_SUCCESS;
1162 	return (rval);
1163 
1164 port_attach_cleanup:
1165 	mutex_enter(&fcip_global_mutex);
1166 	(void) fcip_softstate_free(fport);
1167 	fcip_num_attaching--;
1168 	ASSERT(fcip_num_attaching >= 0);
1169 	mutex_exit(&fcip_global_mutex);
1170 	rval = FC_FAILURE;
1171 	return (rval);
1172 }
1173 
1174 
1175 /*
1176  * Handler for DDI_RESUME operations. Port must be ready to restart IP
1177  * traffic on resume
1178  */
1179 static int
1180 fcip_handle_resume(fcip_port_info_t *fport, fc_ulp_port_info_t *port_info,
1181     fc_attach_cmd_t cmd)
1182 {
1183 	int 		rval = FC_SUCCESS;
1184 	struct fcip	*fptr = fport->fcipp_fcip;
1185 	struct fcipstr	*tslp;
1186 	int		index;
1187 
1188 
1189 	ASSERT(fptr != NULL);
1190 
1191 	mutex_enter(&fptr->fcip_mutex);
1192 
1193 	if (cmd == FC_CMD_POWER_UP) {
1194 		fptr->fcip_flags &= ~(FCIP_POWER_DOWN);
1195 		if (fptr->fcip_flags & FCIP_SUSPENDED) {
1196 			mutex_exit(&fptr->fcip_mutex);
1197 			return (FC_SUCCESS);
1198 		}
1199 	} else if (cmd == FC_CMD_RESUME) {
1200 		fptr->fcip_flags &= ~(FCIP_SUSPENDED);
1201 	} else {
1202 		mutex_exit(&fptr->fcip_mutex);
1203 		return (FC_FAILURE);
1204 	}
1205 
1206 	/*
1207 	 * set the current port state and topology
1208 	 */
1209 	fport->fcipp_topology = port_info->port_flags;
1210 	fport->fcipp_pstate = port_info->port_state;
1211 
1212 	rw_enter(&fcipstruplock, RW_READER);
1213 	for (tslp = fcipstrup; tslp; tslp = tslp->sl_nextp) {
1214 		if (tslp->sl_fcip == fptr) {
1215 			break;
1216 		}
1217 	}
1218 	rw_exit(&fcipstruplock);
1219 
1220 	/*
1221 	 * No active streams on this port
1222 	 */
1223 	if (tslp == NULL) {
1224 		rval = FC_SUCCESS;
1225 		goto done;
1226 	}
1227 
1228 	mutex_enter(&fptr->fcip_rt_mutex);
1229 	for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
1230 		struct fcip_routing_table 	*frp;
1231 
1232 		frp = fptr->fcip_rtable[index];
1233 		while (frp) {
1234 			uint32_t		did;
1235 			/*
1236 			 * Mark the broadcast RTE available again. It
1237 			 * was marked SUSPENDED during SUSPEND.
1238 			 */
1239 			did = fcip_get_broadcast_did(fptr);
1240 			if (frp->fcipr_d_id.port_id == did) {
1241 				frp->fcipr_state = 0;
1242 				index = FCIP_RT_HASH_ELEMS;
1243 				break;
1244 			}
1245 			frp = frp->fcipr_next;
1246 		}
1247 	}
1248 	mutex_exit(&fptr->fcip_rt_mutex);
1249 
1250 	/*
1251 	 * fcip_handle_topology will update the port entries in the
1252 	 * routing table.
1253 	 * fcip_handle_topology also takes care of resetting the
1254 	 * fcipr_state field in the routing table structure. The entries
1255 	 * were set to RT_INVALID during suspend.
1256 	 */
1257 	fcip_handle_topology(fptr);
1258 
1259 done:
1260 	/*
1261 	 * Restart the timeout thread
1262 	 */
1263 	fptr->fcip_timeout_id = timeout(fcip_timeout, fptr,
1264 	    drv_usectohz(1000000));
1265 	mutex_exit(&fptr->fcip_mutex);
1266 	return (rval);
1267 }
1268 
1269 
1270 /*
1271  * Insert a destination port entry into the routing table for
1272  * this port
1273  */
1274 static void
1275 fcip_rt_update(struct fcip *fptr, fc_portmap_t *devlist, uint32_t listlen)
1276 {
1277 	struct fcip_routing_table	*frp;
1278 	fcip_port_info_t		*fport = fptr->fcip_port_info;
1279 	int				hash_bucket, i;
1280 	fc_portmap_t			*pmap;
1281 	char				wwn_buf[20];
1282 
1283 	FCIP_TNF_PROBE_2((fcip_rt_update, "fcip io", /* CSTYLED */,
1284 		tnf_string, msg, "enter",
1285 		tnf_int, listlen, listlen));
1286 
1287 	ASSERT(!mutex_owned(&fptr->fcip_mutex));
1288 	mutex_enter(&fptr->fcip_rt_mutex);
1289 
1290 	for (i = 0; i < listlen; i++) {
1291 		pmap = &(devlist[i]);
1292 
1293 		frp = fcip_lookup_rtable(fptr, &(pmap->map_pwwn),
1294 		    FCIP_COMPARE_PWWN);
1295 		/*
1296 		 * If an entry for a port in the devlist exists in the
1297 		 * in the per port routing table, make sure the data
1298 		 * is current. We need to do this irrespective of the
1299 		 * underlying port topology.
1300 		 */
1301 		switch (pmap->map_type) {
1302 		/* FALLTHROUGH */
1303 		case PORT_DEVICE_NOCHANGE:
1304 		/* FALLTHROUGH */
1305 		case PORT_DEVICE_USER_LOGIN:
1306 		/* FALLTHROUGH */
1307 		case PORT_DEVICE_CHANGED:
1308 		/* FALLTHROUGH */
1309 		case PORT_DEVICE_NEW:
1310 			if (frp == NULL) {
1311 				goto add_new_entry;
1312 			} else if (frp) {
1313 				goto update_entry;
1314 			} else {
1315 				continue;
1316 			}
1317 
1318 		case PORT_DEVICE_OLD:
1319 		/* FALLTHROUGH */
1320 		case PORT_DEVICE_USER_LOGOUT:
1321 			/*
1322 			 * Mark entry for removal from Routing Table if
1323 			 * one exists. Let the timeout thread actually
1324 			 * remove the entry after we've given up hopes
1325 			 * of the port ever showing up.
1326 			 */
1327 			if (frp) {
1328 				uint32_t		did;
1329 
1330 				/*
1331 				 * Mark the routing table as invalid to bail
1332 				 * the packets early that are in transit
1333 				 */
1334 				did = fptr->fcip_broadcast_did;
1335 				if (frp->fcipr_d_id.port_id != did) {
1336 					frp->fcipr_pd = NULL;
1337 					frp->fcipr_state = FCIP_RT_INVALID;
1338 					frp->fcipr_invalid_timeout =
1339 					    fptr->fcip_timeout_ticks +
1340 					    FCIP_RTE_TIMEOUT;
1341 				}
1342 			}
1343 			continue;
1344 
1345 		default:
1346 			FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_WARN,
1347 			    "unknown map flags in rt_update"));
1348 			continue;
1349 		}
1350 add_new_entry:
1351 		ASSERT(frp == NULL);
1352 		hash_bucket = FCIP_RT_HASH(pmap->map_pwwn.raw_wwn);
1353 
1354 		ASSERT(hash_bucket < FCIP_RT_HASH_ELEMS);
1355 
1356 		FCIP_TNF_PROBE_2((fcip_rt_update, "cfip io", /* CSTYLED */,
1357 			tnf_string, msg,
1358 			"add new entry",
1359 			tnf_int, hashbucket, hash_bucket));
1360 
1361 		frp = (struct fcip_routing_table *)
1362 		    kmem_zalloc(sizeof (struct fcip_routing_table), KM_SLEEP);
1363 		/* insert at beginning of hash bucket */
1364 		frp->fcipr_next = fptr->fcip_rtable[hash_bucket];
1365 		fptr->fcip_rtable[hash_bucket] = frp;
1366 		fc_wwn_to_str(&pmap->map_pwwn, wwn_buf);
1367 		FCIP_DEBUG(FCIP_DEBUG_ATTACH, (CE_NOTE,
1368 		    "added entry for pwwn %s and d_id 0x%x",
1369 		    wwn_buf, pmap->map_did.port_id));
1370 update_entry:
1371 		bcopy((void *)&pmap->map_pwwn,
1372 		    (void *)&frp->fcipr_pwwn, sizeof (la_wwn_t));
1373 		bcopy((void *)&pmap->map_nwwn, (void *)&frp->fcipr_nwwn,
1374 		    sizeof (la_wwn_t));
1375 		frp->fcipr_d_id = pmap->map_did;
1376 		frp->fcipr_state = pmap->map_state;
1377 		frp->fcipr_pd = pmap->map_pd;
1378 
1379 		/*
1380 		 * If there is no pd for a destination port that is not
1381 		 * a broadcast entry, the port is pretty much unusable - so
1382 		 * mark the port for removal so we can try adding back the
1383 		 * entry again.
1384 		 */
1385 		if ((frp->fcipr_pd == NULL) &&
1386 		    (frp->fcipr_d_id.port_id != fptr->fcip_broadcast_did)) {
1387 			frp->fcipr_state = PORT_DEVICE_INVALID;
1388 			frp->fcipr_invalid_timeout = fptr->fcip_timeout_ticks +
1389 			    (FCIP_RTE_TIMEOUT / 2);
1390 		}
1391 		frp->fcipr_fca_dev =
1392 		    fc_ulp_get_fca_device(fport->fcipp_handle, pmap->map_did);
1393 
1394 		/*
1395 		 * login to the remote port. Don't worry about
1396 		 * plogi failures for now
1397 		 */
1398 		if (pmap->map_pd != NULL) {
1399 			(void) fcip_do_plogi(fptr, frp);
1400 		} else if (FC_TOP_EXTERNAL(fport->fcipp_topology)) {
1401 			fc_wwn_to_str(&frp->fcipr_pwwn, wwn_buf);
1402 			FCIP_DEBUG(FCIP_DEBUG_MISC, (CE_NOTE,
1403 			    "logging into pwwn %s, d_id 0x%x",
1404 			    wwn_buf, frp->fcipr_d_id.port_id));
1405 			(void) fcip_do_plogi(fptr, frp);
1406 		}
1407 
1408 		FCIP_TNF_BYTE_ARRAY(fcip_rt_update, "fcip io", "detail",
1409 			"new wwn in rt", pwwn,
1410 			&frp->fcipr_pwwn, sizeof (la_wwn_t));
1411 	}
1412 	mutex_exit(&fptr->fcip_rt_mutex);
1413 }
1414 
1415 
1416 /*
1417  * return a matching routing table entry for a given fcip instance
1418  */
1419 struct fcip_routing_table *
1420 fcip_lookup_rtable(struct fcip *fptr, la_wwn_t *wwn, int matchflag)
1421 {
1422 	struct fcip_routing_table	*frp = NULL;
1423 	int				hash_bucket;
1424 
1425 
1426 	FCIP_TNF_PROBE_1((fcip_lookup_rtable, "fcip io", /* CSTYLED */,
1427 		tnf_string, msg, "enter"));
1428 	FCIP_TNF_BYTE_ARRAY(fcip_lookup_rtable, "fcip io", "detail",
1429 		"rtable lookup for", wwn,
1430 		&wwn->raw_wwn, sizeof (la_wwn_t));
1431 	FCIP_TNF_PROBE_2((fcip_lookup_rtable, "fcip io", /* CSTYLED */,
1432 		tnf_string, msg, "match by",
1433 		tnf_int, matchflag, matchflag));
1434 
1435 	ASSERT(mutex_owned(&fptr->fcip_rt_mutex));
1436 
1437 	hash_bucket = FCIP_RT_HASH(wwn->raw_wwn);
1438 	frp = fptr->fcip_rtable[hash_bucket];
1439 	while (frp != NULL) {
1440 
1441 		FCIP_TNF_BYTE_ARRAY(fcip_lookup_rtable, "fcip io", "detail",
1442 			"rtable entry", nwwn,
1443 			&(frp->fcipr_nwwn.raw_wwn), sizeof (la_wwn_t));
1444 
1445 		if (fcip_wwn_compare(&frp->fcipr_pwwn, wwn, matchflag) == 0) {
1446 			break;
1447 		}
1448 
1449 		frp = frp->fcipr_next;
1450 	}
1451 	FCIP_TNF_PROBE_2((fcip_lookup_rtable, "fcip io", /* CSTYLED */,
1452 		tnf_string, msg, "lookup result",
1453 		tnf_opaque, frp, frp));
1454 	return (frp);
1455 }
1456 
1457 /*
1458  * Attach of fcip under pseudo. The actual setup of the interface
1459  * actually happens in fcip_port_attach on a callback from the
1460  * transport. The port_attach callback however can proceed only
1461  * after the devinfo for fcip has been created under pseudo
1462  */
1463 static int
1464 fcip_attach(dev_info_t *dip, ddi_attach_cmd_t cmd)
1465 {
1466 	switch ((int)cmd) {
1467 
1468 	case DDI_ATTACH: {
1469 		ASSERT(fcip_module_dip == NULL);
1470 		fcip_module_dip = dip;
1471 
1472 		/*
1473 		 * this call originates as a result of fcip's conf
1474 		 * file entry and will result in a fcip instance being
1475 		 * a child of pseudo. We should ensure here that the port
1476 		 * driver (fp) has been loaded and initted since we would
1477 		 * never get a port attach callback without fp being loaded.
1478 		 * If we are unable to succesfully load and initalize fp -
1479 		 * just fail this attach.
1480 		 */
1481 		mutex_enter(&fcip_global_mutex);
1482 
1483 		FCIP_DEBUG(FCIP_DEBUG_ATTACH,
1484 		    (CE_WARN, "global cv - signaling"));
1485 
1486 		cv_signal(&fcip_global_cv);
1487 
1488 		FCIP_DEBUG(FCIP_DEBUG_ATTACH,
1489 		    (CE_WARN, "global cv - signaled"));
1490 		mutex_exit(&fcip_global_mutex);
1491 		return (DDI_SUCCESS);
1492 	}
1493 	case DDI_RESUME:
1494 		/*
1495 		 * Resume appears trickier
1496 		 */
1497 		return (DDI_SUCCESS);
1498 	default:
1499 		return (DDI_FAILURE);
1500 	}
1501 }
1502 
1503 
1504 /*
1505  * The detach entry point to permit unloading fcip. We make sure
1506  * there are no active streams before we proceed with the detach
1507  */
1508 /* ARGSUSED */
1509 static int
1510 fcip_detach(dev_info_t *dip, ddi_detach_cmd_t cmd)
1511 {
1512 	struct fcip		*fptr;
1513 	fcip_port_info_t	*fport;
1514 	int			detached;
1515 
1516 	switch (cmd) {
1517 	case DDI_DETACH: {
1518 		/*
1519 		 * If we got here, any active streams should have been
1520 		 * unplumbed but check anyway
1521 		 */
1522 		mutex_enter(&fcip_global_mutex);
1523 		if (fcipstrup != NULL) {
1524 			mutex_exit(&fcip_global_mutex);
1525 			return (DDI_FAILURE);
1526 		}
1527 
1528 		if (fcip_port_head != NULL) {
1529 			/*
1530 			 * Check to see if we have unattached/unbound
1531 			 * ports. If all the ports are unattached/unbound go
1532 			 * ahead and unregister with the transport
1533 			 */
1534 			fport = fcip_port_head;
1535 			while (fport != NULL) {
1536 				fptr = fport->fcipp_fcip;
1537 				if (fptr == NULL) {
1538 					continue;
1539 				}
1540 				mutex_enter(&fptr->fcip_mutex);
1541 				fptr->fcip_flags |= FCIP_DETACHING;
1542 				if (fptr->fcip_ipq ||
1543 				    fptr->fcip_flags & (FCIP_IN_TIMEOUT |
1544 				    FCIP_IN_CALLBACK | FCIP_ATTACHING |
1545 				    FCIP_SUSPENDED | FCIP_POWER_DOWN |
1546 				    FCIP_REG_INPROGRESS)) {
1547 					FCIP_TNF_PROBE_1((fcip_detach,
1548 					    "fcip io", /* CSTYLED */,
1549 					    tnf_string, msg,
1550 					    "fcip instance busy"));
1551 
1552 					mutex_exit(&fptr->fcip_mutex);
1553 					FCIP_DEBUG(FCIP_DEBUG_DETACH, (CE_WARN,
1554 					    "fcip instance busy"));
1555 					break;
1556 				}
1557 				/*
1558 				 * Check for any outstanding pkts. If yes
1559 				 * fail the detach
1560 				 */
1561 				mutex_enter(&fptr->fcip_dest_mutex);
1562 				if (fcip_port_get_num_pkts(fptr) > 0) {
1563 					mutex_exit(&fptr->fcip_dest_mutex);
1564 					mutex_exit(&fptr->fcip_mutex);
1565 					FCIP_DEBUG(FCIP_DEBUG_DETACH, (CE_WARN,
1566 					    "fcip instance busy - pkts "
1567 					    "pending"));
1568 					break;
1569 				}
1570 				mutex_exit(&fptr->fcip_dest_mutex);
1571 
1572 				mutex_enter(&fptr->fcip_rt_mutex);
1573 				if (fcip_plogi_in_progress(fptr)) {
1574 					mutex_exit(&fptr->fcip_rt_mutex);
1575 					mutex_exit(&fptr->fcip_mutex);
1576 					FCIP_DEBUG(FCIP_DEBUG_DETACH, (CE_WARN,
1577 					    "fcip instance busy - plogi in "
1578 					    "progress"));
1579 					break;
1580 				}
1581 				mutex_exit(&fptr->fcip_rt_mutex);
1582 
1583 				mutex_exit(&fptr->fcip_mutex);
1584 				fport = fport->fcipp_next;
1585 			}
1586 			/*
1587 			 * if fport is non NULL - we have active ports
1588 			 */
1589 			if (fport != NULL) {
1590 				/*
1591 				 * Remove the DETACHING flags on the ports
1592 				 */
1593 				fport = fcip_port_head;
1594 				while (fport != NULL) {
1595 					fptr = fport->fcipp_fcip;
1596 					mutex_enter(&fptr->fcip_mutex);
1597 					fptr->fcip_flags &= ~(FCIP_DETACHING);
1598 					mutex_exit(&fptr->fcip_mutex);
1599 					fport = fport->fcipp_next;
1600 				}
1601 				mutex_exit(&fcip_global_mutex);
1602 				return (DDI_FAILURE);
1603 			}
1604 		}
1605 
1606 		/*
1607 		 * free up all softstate structures
1608 		 */
1609 		fport = fcip_port_head;
1610 		while (fport != NULL) {
1611 			detached = 1;
1612 
1613 			fptr = fport->fcipp_fcip;
1614 			if (fptr) {
1615 				mutex_enter(&fptr->fcip_mutex);
1616 				/*
1617 				 * Check to see if somebody beat us to the
1618 				 * punch
1619 				 */
1620 				detached = fptr->fcip_flags & FCIP_DETACHED;
1621 				fptr->fcip_flags &= ~(FCIP_DETACHING);
1622 				fptr->fcip_flags |= FCIP_DETACHED;
1623 				mutex_exit(&fptr->fcip_mutex);
1624 			}
1625 
1626 			if (!detached) {
1627 				fport = fcip_softstate_free(fport);
1628 			} else {
1629 				/*
1630 				 * If the port was marked as detached
1631 				 * but it was still in the list, that
1632 				 * means another thread has marked it
1633 				 * but we got in while it released the
1634 				 * fcip_global_mutex in softstate_free.
1635 				 * Given that, we're still safe to use
1636 				 * fport->fcipp_next to find out what
1637 				 * the next port on the list is.
1638 				 */
1639 				fport = fport->fcipp_next;
1640 			}
1641 
1642 			FCIP_DEBUG(FCIP_DEBUG_DETACH,
1643 			    (CE_NOTE, "detaching port"));
1644 
1645 			FCIP_TNF_PROBE_1((fcip_detach,
1646 				"fcip io", /* CSTYLED */, tnf_string,
1647 				msg, "detaching port"));
1648 		}
1649 
1650 		/*
1651 		 * If we haven't removed all the port structures, we
1652 		 * aren't yet ready to be detached.
1653 		 */
1654 		if (fcip_port_head != NULL) {
1655 			mutex_exit(&fcip_global_mutex);
1656 			return (DDI_FAILURE);
1657 		}
1658 
1659 		fcip_num_instances = 0;
1660 		mutex_exit(&fcip_global_mutex);
1661 		fcip_module_dip = NULL;
1662 		return (DDI_SUCCESS);
1663 	}
1664 	case DDI_SUSPEND:
1665 		return (DDI_SUCCESS);
1666 	default:
1667 		return (DDI_FAILURE);
1668 	}
1669 }
1670 
1671 /*
1672  * The port_detach callback is called from the transport when a
1673  * FC port is being removed from the transport's control. This routine
1674  * provides fcip with an opportunity to cleanup all activities and
1675  * structures on the port marked for removal.
1676  */
1677 /* ARGSUSED */
1678 static int
1679 fcip_port_detach(opaque_t ulp_handle, fc_ulp_port_info_t *port_info,
1680     fc_detach_cmd_t cmd)
1681 {
1682 	int 			rval = FC_FAILURE;
1683 	fcip_port_info_t	*fport;
1684 	struct fcip		*fptr;
1685 	struct fcipstr		*strp;
1686 
1687 	switch (cmd) {
1688 	case FC_CMD_DETACH: {
1689 		mutex_enter(&fcip_global_mutex);
1690 
1691 		if (fcip_port_head == NULL) {
1692 			/*
1693 			 * we are all done but our fini has not been
1694 			 * called yet!! Let's hope we have no active
1695 			 * fcip instances here. - strange secnario but
1696 			 * no harm in having this return a success.
1697 			 */
1698 			fcip_check_remove_minor_node();
1699 
1700 			mutex_exit(&fcip_global_mutex);
1701 			return (FC_SUCCESS);
1702 		} else {
1703 			/*
1704 			 * traverse the port list
1705 			 */
1706 			fport = fcip_port_head;
1707 			while (fport != NULL) {
1708 				if (fport->fcipp_handle ==
1709 				    port_info->port_handle) {
1710 					fptr = fport->fcipp_fcip;
1711 
1712 					/*
1713 					 * Fail the port detach if there is
1714 					 * still an attached, bound stream on
1715 					 * this interface.
1716 					 */
1717 
1718 					rw_enter(&fcipstruplock, RW_READER);
1719 
1720 					for (strp = fcipstrup; strp != NULL;
1721 					    strp = strp->sl_nextp) {
1722 						if (strp->sl_fcip == fptr) {
1723 							rw_exit(&fcipstruplock);
1724 							mutex_exit(
1725 							    &fcip_global_mutex);
1726 							return (FC_FAILURE);
1727 						}
1728 					}
1729 
1730 					rw_exit(&fcipstruplock);
1731 
1732 					/*
1733 					 * fail port detach if we are in
1734 					 * the middle of a deferred port attach
1735 					 * or if the port has outstanding pkts
1736 					 */
1737 					if (fptr != NULL) {
1738 						mutex_enter(&fptr->fcip_mutex);
1739 						if (fcip_check_port_busy
1740 						    (fptr) ||
1741 						    (fptr->fcip_flags &
1742 						    FCIP_DETACHED)) {
1743 							mutex_exit(
1744 							    &fptr->fcip_mutex);
1745 							mutex_exit(
1746 							    &fcip_global_mutex);
1747 							return (FC_FAILURE);
1748 						}
1749 
1750 						fptr->fcip_flags |=
1751 						    FCIP_DETACHED;
1752 						mutex_exit(&fptr->fcip_mutex);
1753 					}
1754 					(void) fcip_softstate_free(fport);
1755 
1756 					fcip_check_remove_minor_node();
1757 					mutex_exit(&fcip_global_mutex);
1758 					return (FC_SUCCESS);
1759 				}
1760 				fport = fport->fcipp_next;
1761 			}
1762 			ASSERT(fport == NULL);
1763 		}
1764 		mutex_exit(&fcip_global_mutex);
1765 		break;
1766 	}
1767 	case FC_CMD_POWER_DOWN:
1768 	/* FALLTHROUGH */
1769 	case FC_CMD_SUSPEND:
1770 		mutex_enter(&fcip_global_mutex);
1771 		fport = fcip_port_head;
1772 		while (fport != NULL) {
1773 			if (fport->fcipp_handle == port_info->port_handle) {
1774 				break;
1775 			}
1776 			fport = fport->fcipp_next;
1777 		}
1778 		if (fport == NULL) {
1779 			mutex_exit(&fcip_global_mutex);
1780 			break;
1781 		}
1782 		rval = fcip_handle_suspend(fport, cmd);
1783 		mutex_exit(&fcip_global_mutex);
1784 		break;
1785 	default:
1786 		FCIP_DEBUG(FCIP_DEBUG_DETACH,
1787 		    (CE_WARN, "unknown port detach command!!"));
1788 		break;
1789 	}
1790 	return (rval);
1791 }
1792 
1793 
1794 /*
1795  * Returns 0 if the port is not busy, else returns non zero.
1796  */
1797 static int
1798 fcip_check_port_busy(struct fcip *fptr)
1799 {
1800 	int rval = 0, num_pkts = 0;
1801 
1802 	ASSERT(fptr != NULL);
1803 	ASSERT(MUTEX_HELD(&fptr->fcip_mutex));
1804 
1805 	mutex_enter(&fptr->fcip_dest_mutex);
1806 
1807 	if (fptr->fcip_flags & FCIP_PORT_BUSY ||
1808 	    ((num_pkts = fcip_port_get_num_pkts(fptr)) > 0) ||
1809 	    fptr->fcip_num_ipkts_pending) {
1810 		rval = 1;
1811 		FCIP_DEBUG(FCIP_DEBUG_DETACH,
1812 		    (CE_NOTE, "!fcip_check_port_busy: port is busy "
1813 		    "fcip_flags: 0x%x, num_pkts: 0x%x, ipkts_pending: 0x%lx!",
1814 		    fptr->fcip_flags, num_pkts, fptr->fcip_num_ipkts_pending));
1815 	}
1816 
1817 	mutex_exit(&fptr->fcip_dest_mutex);
1818 	return (rval);
1819 }
1820 
1821 /*
1822  * Helper routine to remove fcip's minor node
1823  * There is one minor node per system and it should be removed if there are no
1824  * other fcip instances (which has a 1:1 mapping for fp instances) present
1825  */
1826 static void
1827 fcip_check_remove_minor_node(void)
1828 {
1829 	ASSERT(MUTEX_HELD(&fcip_global_mutex));
1830 
1831 	/*
1832 	 * If there are no more fcip (fp) instances, remove the
1833 	 * minor node for fcip.
1834 	 * Reset fcip_minor_node_created to invalidate it.
1835 	 */
1836 	if (fcip_num_instances == 0 && (fcip_module_dip != NULL)) {
1837 		ddi_remove_minor_node(fcip_module_dip, NULL);
1838 		fcip_minor_node_created = 0;
1839 	}
1840 }
1841 
1842 /*
1843  * This routine permits the suspend operation during a CPR/System
1844  * power management operation. The routine basically quiesces I/Os
1845  * on all active interfaces
1846  */
1847 static int
1848 fcip_handle_suspend(fcip_port_info_t *fport, fc_detach_cmd_t cmd)
1849 {
1850 	struct fcip	*fptr = fport->fcipp_fcip;
1851 	timeout_id_t	tid;
1852 	int 		index;
1853 	int		tryagain = 0;
1854 	int		count;
1855 	struct fcipstr	*tslp;
1856 
1857 
1858 	ASSERT(fptr != NULL);
1859 	mutex_enter(&fptr->fcip_mutex);
1860 
1861 	/*
1862 	 * Fail if we are in the middle of a callback. Don't use delay during
1863 	 * suspend since clock intrs are not available so busy wait
1864 	 */
1865 	count = 0;
1866 	while (count++ < 15 &&
1867 	    ((fptr->fcip_flags & FCIP_IN_CALLBACK) ||
1868 	    (fptr->fcip_flags & FCIP_IN_TIMEOUT))) {
1869 		mutex_exit(&fptr->fcip_mutex);
1870 		drv_usecwait(1000000);
1871 		mutex_enter(&fptr->fcip_mutex);
1872 	}
1873 
1874 	if (fptr->fcip_flags & FCIP_IN_CALLBACK ||
1875 	    fptr->fcip_flags & FCIP_IN_TIMEOUT) {
1876 		mutex_exit(&fptr->fcip_mutex);
1877 		return (FC_FAILURE);
1878 	}
1879 
1880 	if (cmd == FC_CMD_POWER_DOWN) {
1881 		if (fptr->fcip_flags & FCIP_SUSPENDED) {
1882 			fptr->fcip_flags |= FCIP_POWER_DOWN;
1883 			mutex_exit(&fptr->fcip_mutex);
1884 			goto success;
1885 		} else {
1886 			fptr->fcip_flags |= FCIP_POWER_DOWN;
1887 		}
1888 	} else if (cmd == FC_CMD_SUSPEND) {
1889 		fptr->fcip_flags |= FCIP_SUSPENDED;
1890 	} else {
1891 		mutex_exit(&fptr->fcip_mutex);
1892 		return (FC_FAILURE);
1893 	}
1894 
1895 	mutex_exit(&fptr->fcip_mutex);
1896 	/*
1897 	 * If no streams are plumbed - its the easiest case - Just
1898 	 * bail out without having to do much
1899 	 */
1900 
1901 	rw_enter(&fcipstruplock, RW_READER);
1902 	for (tslp = fcipstrup; tslp; tslp = tslp->sl_nextp) {
1903 		if (tslp->sl_fcip == fptr) {
1904 			break;
1905 		}
1906 	}
1907 	rw_exit(&fcipstruplock);
1908 
1909 	/*
1910 	 * No active streams on this port
1911 	 */
1912 	if (tslp == NULL) {
1913 		goto success;
1914 	}
1915 
1916 	/*
1917 	 * Walk through each Routing table structure and check if
1918 	 * the destination table has any outstanding commands. If yes
1919 	 * wait for the commands to drain. Since we go through each
1920 	 * routing table entry in succession, it may be wise to wait
1921 	 * only a few seconds for each entry.
1922 	 */
1923 	mutex_enter(&fptr->fcip_rt_mutex);
1924 	while (!tryagain) {
1925 
1926 		tryagain = 0;
1927 		for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
1928 			struct fcip_routing_table 	*frp;
1929 			struct fcip_dest 		*fdestp;
1930 			la_wwn_t			*pwwn;
1931 			int				hash_bucket;
1932 
1933 			frp = fptr->fcip_rtable[index];
1934 			while (frp) {
1935 				/*
1936 				 * Mark the routing table as SUSPENDED. Even
1937 				 * mark the broadcast entry SUSPENDED to
1938 				 * prevent any ARP or other broadcasts. We
1939 				 * can reset the state of the broadcast
1940 				 * RTE when we resume.
1941 				 */
1942 				frp->fcipr_state = FCIP_RT_SUSPENDED;
1943 				pwwn = &frp->fcipr_pwwn;
1944 
1945 				/*
1946 				 * Get hold of destination pointer
1947 				 */
1948 				mutex_enter(&fptr->fcip_dest_mutex);
1949 
1950 				hash_bucket = FCIP_DEST_HASH(pwwn->raw_wwn);
1951 				ASSERT(hash_bucket < FCIP_DEST_HASH_ELEMS);
1952 
1953 				fdestp = fptr->fcip_dest[hash_bucket];
1954 				while (fdestp != NULL) {
1955 					mutex_enter(&fdestp->fcipd_mutex);
1956 					if (fdestp->fcipd_rtable) {
1957 						if (fcip_wwn_compare(pwwn,
1958 						    &fdestp->fcipd_pwwn,
1959 						    FCIP_COMPARE_PWWN) == 0) {
1960 							mutex_exit(
1961 							&fdestp->fcipd_mutex);
1962 							break;
1963 						}
1964 					}
1965 					mutex_exit(&fdestp->fcipd_mutex);
1966 					fdestp = fdestp->fcipd_next;
1967 				}
1968 
1969 				mutex_exit(&fptr->fcip_dest_mutex);
1970 				if (fdestp == NULL) {
1971 					frp = frp->fcipr_next;
1972 					continue;
1973 				}
1974 
1975 				/*
1976 				 * Wait for fcip_wait_cmds seconds for
1977 				 * the commands to drain.
1978 				 */
1979 				count = 0;
1980 				mutex_enter(&fdestp->fcipd_mutex);
1981 				while (fdestp->fcipd_ncmds &&
1982 				    count < fcip_wait_cmds) {
1983 					mutex_exit(&fdestp->fcipd_mutex);
1984 					mutex_exit(&fptr->fcip_rt_mutex);
1985 					drv_usecwait(1000000);
1986 					mutex_enter(&fptr->fcip_rt_mutex);
1987 					mutex_enter(&fdestp->fcipd_mutex);
1988 					count++;
1989 				}
1990 				/*
1991 				 * Check if we were able to drain all cmds
1992 				 * successfully. Else continue with other
1993 				 * ports and try during the second pass
1994 				 */
1995 				if (fdestp->fcipd_ncmds) {
1996 					tryagain++;
1997 				}
1998 				mutex_exit(&fdestp->fcipd_mutex);
1999 
2000 				frp = frp->fcipr_next;
2001 			}
2002 		}
2003 		if (tryagain == 0) {
2004 			break;
2005 		}
2006 	}
2007 	mutex_exit(&fptr->fcip_rt_mutex);
2008 
2009 	if (tryagain) {
2010 		mutex_enter(&fptr->fcip_mutex);
2011 		fptr->fcip_flags &= ~(FCIP_SUSPENDED | FCIP_POWER_DOWN);
2012 		mutex_exit(&fptr->fcip_mutex);
2013 		return (FC_FAILURE);
2014 	}
2015 
2016 success:
2017 	mutex_enter(&fptr->fcip_mutex);
2018 	tid = fptr->fcip_timeout_id;
2019 	fptr->fcip_timeout_id = NULL;
2020 	mutex_exit(&fptr->fcip_mutex);
2021 
2022 	(void) untimeout(tid);
2023 
2024 	return (FC_SUCCESS);
2025 }
2026 
2027 /*
2028  * the getinfo(9E) entry point
2029  */
2030 /* ARGSUSED */
2031 static int
2032 fcip_getinfo(dev_info_t *dip, ddi_info_cmd_t cmd, void *arg, void **result)
2033 {
2034 	int rval = DDI_FAILURE;
2035 
2036 	switch (cmd) {
2037 	case DDI_INFO_DEVT2DEVINFO:
2038 		*result = fcip_module_dip;
2039 		if (*result)
2040 			rval = DDI_SUCCESS;
2041 		break;
2042 
2043 	case DDI_INFO_DEVT2INSTANCE:
2044 		*result = (void *)0;
2045 		rval = DDI_SUCCESS;
2046 		break;
2047 	default:
2048 		break;
2049 	}
2050 
2051 	return (rval);
2052 }
2053 
2054 /*
2055  * called from fcip_attach to initialize kstats for the link
2056  */
2057 /* ARGSUSED */
2058 static void
2059 fcip_kstat_init(struct fcip *fptr)
2060 {
2061 	int instance;
2062 	char buf[16];
2063 	struct fcipstat	*fcipstatp;
2064 
2065 	ASSERT(mutex_owned(&fptr->fcip_mutex));
2066 
2067 	instance = ddi_get_instance(fptr->fcip_dip);
2068 	(void) sprintf(buf, "fcip%d", instance);
2069 
2070 #ifdef	kstat
2071 	fptr->fcip_kstatp = kstat_create("fcip", instance, buf, "net",
2072 	    KSTAT_TYPE_NAMED,
2073 	    (sizeof (struct fcipstat)/ sizeof (kstat_named_t)),
2074 	    KSTAT_FLAG_PERSISTENT);
2075 #else
2076 	fptr->fcip_kstatp = kstat_create("fcip", instance, buf, "net",
2077 	    KSTAT_TYPE_NAMED,
2078 	    (sizeof (struct fcipstat)/ sizeof (kstat_named_t)), 0);
2079 #endif
2080 	if (fptr->fcip_kstatp == NULL) {
2081 		FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_WARN, "kstat created failed"));
2082 		return;
2083 	}
2084 
2085 	fcipstatp = (struct  fcipstat *)fptr->fcip_kstatp->ks_data;
2086 	kstat_named_init(&fcipstatp->fcips_ipackets,	"ipackets",
2087 		KSTAT_DATA_ULONG);
2088 	kstat_named_init(&fcipstatp->fcips_ierrors,	"ierrors",
2089 		KSTAT_DATA_ULONG);
2090 	kstat_named_init(&fcipstatp->fcips_opackets,	"opackets",
2091 		KSTAT_DATA_ULONG);
2092 	kstat_named_init(&fcipstatp->fcips_oerrors,	"oerrors",
2093 		KSTAT_DATA_ULONG);
2094 	kstat_named_init(&fcipstatp->fcips_collisions,	"collisions",
2095 		KSTAT_DATA_ULONG);
2096 	kstat_named_init(&fcipstatp->fcips_nocanput,	"nocanput",
2097 		KSTAT_DATA_ULONG);
2098 	kstat_named_init(&fcipstatp->fcips_allocbfail,	"allocbfail",
2099 		KSTAT_DATA_ULONG);
2100 
2101 	kstat_named_init(&fcipstatp->fcips_defer, "defer",
2102 		KSTAT_DATA_ULONG);
2103 	kstat_named_init(&fcipstatp->fcips_fram, "fram",
2104 		KSTAT_DATA_ULONG);
2105 	kstat_named_init(&fcipstatp->fcips_crc, "crc",
2106 		KSTAT_DATA_ULONG);
2107 	kstat_named_init(&fcipstatp->fcips_oflo, "oflo",
2108 		KSTAT_DATA_ULONG);
2109 	kstat_named_init(&fcipstatp->fcips_uflo, "uflo",
2110 		KSTAT_DATA_ULONG);
2111 	kstat_named_init(&fcipstatp->fcips_missed, "missed",
2112 		KSTAT_DATA_ULONG);
2113 	kstat_named_init(&fcipstatp->fcips_tlcol, "tlcol",
2114 		KSTAT_DATA_ULONG);
2115 	kstat_named_init(&fcipstatp->fcips_trtry, "trtry",
2116 		KSTAT_DATA_ULONG);
2117 	kstat_named_init(&fcipstatp->fcips_tnocar, "tnocar",
2118 		KSTAT_DATA_ULONG);
2119 	kstat_named_init(&fcipstatp->fcips_inits, "inits",
2120 		KSTAT_DATA_ULONG);
2121 	kstat_named_init(&fcipstatp->fcips_notbufs, "notbufs",
2122 		KSTAT_DATA_ULONG);
2123 	kstat_named_init(&fcipstatp->fcips_norbufs, "norbufs",
2124 		KSTAT_DATA_ULONG);
2125 	kstat_named_init(&fcipstatp->fcips_allocbfail, "allocbfail",
2126 		KSTAT_DATA_ULONG);
2127 
2128 	/*
2129 	 * required by kstat for MIB II objects(RFC 1213)
2130 	 */
2131 	kstat_named_init(&fcipstatp->fcips_rcvbytes, "fcips_rcvbytes",
2132 		KSTAT_DATA_ULONG);	/* # octets received */
2133 					/* MIB - ifInOctets */
2134 	kstat_named_init(&fcipstatp->fcips_xmtbytes, "fcips_xmtbytes",
2135 		KSTAT_DATA_ULONG);	/* # octets xmitted */
2136 					/* MIB - ifOutOctets */
2137 	kstat_named_init(&fcipstatp->fcips_multircv,	"fcips_multircv",
2138 		KSTAT_DATA_ULONG);	/* # multicast packets */
2139 					/* delivered to upper layer */
2140 					/* MIB - ifInNUcastPkts */
2141 	kstat_named_init(&fcipstatp->fcips_multixmt,	"fcips_multixmt",
2142 		KSTAT_DATA_ULONG);	/* # multicast packets */
2143 					/* requested to be sent */
2144 					/* MIB - ifOutNUcastPkts */
2145 	kstat_named_init(&fcipstatp->fcips_brdcstrcv, "fcips_brdcstrcv",
2146 		KSTAT_DATA_ULONG); /* # broadcast packets */
2147 					/* delivered to upper layer */
2148 					/* MIB - ifInNUcastPkts */
2149 	kstat_named_init(&fcipstatp->fcips_brdcstxmt, "fcips_brdcstxmt",
2150 		KSTAT_DATA_ULONG);	/* # broadcast packets */
2151 					/* requested to be sent */
2152 					/* MIB - ifOutNUcastPkts */
2153 	kstat_named_init(&fcipstatp->fcips_norcvbuf,	"fcips_norcvbuf",
2154 		KSTAT_DATA_ULONG);	/* # rcv packets discarded */
2155 					/* MIB - ifInDiscards */
2156 	kstat_named_init(&fcipstatp->fcips_noxmtbuf,	"fcips_noxmtbuf",
2157 		KSTAT_DATA_ULONG);	/* # xmt packets discarded */
2158 
2159 	fptr->fcip_kstatp->ks_update = fcip_stat_update;
2160 	fptr->fcip_kstatp->ks_private = (void *) fptr;
2161 	kstat_install(fptr->fcip_kstatp);
2162 }
2163 
2164 /*
2165  * Update the defined kstats for netstat et al to use
2166  */
2167 /* ARGSUSED */
2168 static int
2169 fcip_stat_update(kstat_t *fcip_statp, int val)
2170 {
2171 	struct fcipstat	*fcipstatp;
2172 	struct fcip	*fptr;
2173 
2174 	fptr = (struct fcip *)fcip_statp->ks_private;
2175 	fcipstatp = (struct fcipstat *)fcip_statp->ks_data;
2176 
2177 	if (val == KSTAT_WRITE) {
2178 		fptr->fcip_ipackets	= fcipstatp->fcips_ipackets.value.ul;
2179 		fptr->fcip_ierrors	= fcipstatp->fcips_ierrors.value.ul;
2180 		fptr->fcip_opackets	= fcipstatp->fcips_opackets.value.ul;
2181 		fptr->fcip_oerrors	= fcipstatp->fcips_oerrors.value.ul;
2182 		fptr->fcip_collisions	= fcipstatp->fcips_collisions.value.ul;
2183 		fptr->fcip_defer	= fcipstatp->fcips_defer.value.ul;
2184 		fptr->fcip_fram	= fcipstatp->fcips_fram.value.ul;
2185 		fptr->fcip_crc	= fcipstatp->fcips_crc.value.ul;
2186 		fptr->fcip_oflo	= fcipstatp->fcips_oflo.value.ul;
2187 		fptr->fcip_uflo	= fcipstatp->fcips_uflo.value.ul;
2188 		fptr->fcip_missed	= fcipstatp->fcips_missed.value.ul;
2189 		fptr->fcip_tlcol	= fcipstatp->fcips_tlcol.value.ul;
2190 		fptr->fcip_trtry	= fcipstatp->fcips_trtry.value.ul;
2191 		fptr->fcip_tnocar	= fcipstatp->fcips_tnocar.value.ul;
2192 		fptr->fcip_inits	= fcipstatp->fcips_inits.value.ul;
2193 		fptr->fcip_notbufs	= fcipstatp->fcips_notbufs.value.ul;
2194 		fptr->fcip_norbufs	= fcipstatp->fcips_norbufs.value.ul;
2195 		fptr->fcip_nocanput	= fcipstatp->fcips_nocanput.value.ul;
2196 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2197 		fptr->fcip_rcvbytes	= fcipstatp->fcips_rcvbytes.value.ul;
2198 		fptr->fcip_xmtbytes	= fcipstatp->fcips_xmtbytes.value.ul;
2199 		fptr->fcip_multircv	= fcipstatp->fcips_multircv.value.ul;
2200 		fptr->fcip_multixmt	= fcipstatp->fcips_multixmt.value.ul;
2201 		fptr->fcip_brdcstrcv	= fcipstatp->fcips_brdcstrcv.value.ul;
2202 		fptr->fcip_norcvbuf	= fcipstatp->fcips_norcvbuf.value.ul;
2203 		fptr->fcip_noxmtbuf	= fcipstatp->fcips_noxmtbuf.value.ul;
2204 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2205 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2206 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2207 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2208 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2209 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2210 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2211 		fptr->fcip_allocbfail	= fcipstatp->fcips_allocbfail.value.ul;
2212 
2213 	} else {
2214 		fcipstatp->fcips_ipackets.value.ul	= fptr->fcip_ipackets;
2215 		fcipstatp->fcips_ierrors.value.ul	= fptr->fcip_ierrors;
2216 		fcipstatp->fcips_opackets.value.ul	= fptr->fcip_opackets;
2217 		fcipstatp->fcips_oerrors.value.ul	= fptr->fcip_oerrors;
2218 		fcipstatp->fcips_collisions.value.ul	= fptr->fcip_collisions;
2219 		fcipstatp->fcips_nocanput.value.ul	= fptr->fcip_nocanput;
2220 		fcipstatp->fcips_allocbfail.value.ul	= fptr->fcip_allocbfail;
2221 		fcipstatp->fcips_defer.value.ul	= fptr->fcip_defer;
2222 		fcipstatp->fcips_fram.value.ul	= fptr->fcip_fram;
2223 		fcipstatp->fcips_crc.value.ul	= fptr->fcip_crc;
2224 		fcipstatp->fcips_oflo.value.ul	= fptr->fcip_oflo;
2225 		fcipstatp->fcips_uflo.value.ul	= fptr->fcip_uflo;
2226 		fcipstatp->fcips_missed.value.ul	= fptr->fcip_missed;
2227 		fcipstatp->fcips_tlcol.value.ul	= fptr->fcip_tlcol;
2228 		fcipstatp->fcips_trtry.value.ul	= fptr->fcip_trtry;
2229 		fcipstatp->fcips_tnocar.value.ul	= fptr->fcip_tnocar;
2230 		fcipstatp->fcips_inits.value.ul	= fptr->fcip_inits;
2231 		fcipstatp->fcips_norbufs.value.ul	= fptr->fcip_norbufs;
2232 		fcipstatp->fcips_notbufs.value.ul	= fptr->fcip_notbufs;
2233 		fcipstatp->fcips_rcvbytes.value.ul	= fptr->fcip_rcvbytes;
2234 		fcipstatp->fcips_xmtbytes.value.ul	= fptr->fcip_xmtbytes;
2235 		fcipstatp->fcips_multircv.value.ul	= fptr->fcip_multircv;
2236 		fcipstatp->fcips_multixmt.value.ul	= fptr->fcip_multixmt;
2237 		fcipstatp->fcips_brdcstrcv.value.ul	= fptr->fcip_brdcstrcv;
2238 		fcipstatp->fcips_brdcstxmt.value.ul	= fptr->fcip_brdcstxmt;
2239 		fcipstatp->fcips_norcvbuf.value.ul	= fptr->fcip_norcvbuf;
2240 		fcipstatp->fcips_noxmtbuf.value.ul	= fptr->fcip_noxmtbuf;
2241 
2242 	}
2243 	return (0);
2244 }
2245 
2246 
2247 /*
2248  * fcip_statec_cb: handles all required state change callback notifications
2249  * it receives from the transport
2250  */
2251 /* ARGSUSED */
2252 static void
2253 fcip_statec_cb(opaque_t ulp_handle, opaque_t phandle,
2254     uint32_t port_state, uint32_t port_top, fc_portmap_t changelist[],
2255     uint32_t listlen, uint32_t sid)
2256 {
2257 	fcip_port_info_t	*fport;
2258 	struct fcip 		*fptr;
2259 	struct fcipstr		*slp;
2260 	queue_t			*wrq;
2261 	int			instance;
2262 	int 			index;
2263 	struct fcip_routing_table 	*frtp;
2264 
2265 	fport = fcip_get_port(phandle);
2266 
2267 	if (fport == NULL) {
2268 		return;
2269 	}
2270 
2271 	fptr = fport->fcipp_fcip;
2272 	ASSERT(fptr != NULL);
2273 
2274 	if (fptr == NULL) {
2275 		return;
2276 	}
2277 
2278 	instance = ddi_get_instance(fport->fcipp_dip);
2279 
2280 	FCIP_TNF_PROBE_4((fcip_statec_cb, "fcip io", /* CSTYLED */,
2281 		tnf_string, msg, "state change callback",
2282 		tnf_uint, instance, instance,
2283 		tnf_uint, S_ID, sid,
2284 		tnf_int, count, listlen));
2285 	FCIP_DEBUG(FCIP_DEBUG_ELS,
2286 	    (CE_NOTE, "fcip%d, state change callback: state:0x%x, "
2287 	    "S_ID:0x%x, count:0x%x", instance, port_state, sid, listlen));
2288 
2289 	mutex_enter(&fptr->fcip_mutex);
2290 
2291 	if ((fptr->fcip_flags & (FCIP_DETACHING | FCIP_DETACHED)) ||
2292 	    (fptr->fcip_flags & (FCIP_SUSPENDED | FCIP_POWER_DOWN))) {
2293 		mutex_exit(&fptr->fcip_mutex);
2294 		return;
2295 	}
2296 
2297 	/*
2298 	 * set fcip flags to indicate we are in the middle of a
2299 	 * state change callback so we can wait till the statechange
2300 	 * is handled before succeeding/failing the SUSPEND/POWER DOWN.
2301 	 */
2302 	fptr->fcip_flags |= FCIP_IN_SC_CB;
2303 
2304 	fport->fcipp_pstate = port_state;
2305 
2306 	/*
2307 	 * Check if topology changed. If Yes - Modify the broadcast
2308 	 * RTE entries to understand the new broadcast D_IDs
2309 	 */
2310 	if (fport->fcipp_topology != port_top &&
2311 	    (port_top != FC_TOP_UNKNOWN)) {
2312 		/* REMOVE later */
2313 		FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_NOTE,
2314 		    "topology changed: Old topology: 0x%x New topology 0x%x",
2315 		    fport->fcipp_topology, port_top));
2316 		/*
2317 		 * If topology changed - attempt a rediscovery of
2318 		 * devices. Helps specially in Fabric/Public loops
2319 		 * and if on_demand_node_creation is disabled
2320 		 */
2321 		fport->fcipp_topology = port_top;
2322 		fcip_handle_topology(fptr);
2323 	}
2324 
2325 	mutex_exit(&fptr->fcip_mutex);
2326 
2327 	switch (FC_PORT_STATE_MASK(port_state)) {
2328 	case FC_STATE_ONLINE:
2329 	/* FALLTHROUGH */
2330 	case FC_STATE_LIP:
2331 	/* FALLTHROUGH */
2332 	case FC_STATE_LIP_LBIT_SET:
2333 
2334 		/*
2335 		 * nothing to do here actually other than if we
2336 		 * were actually logged onto a port in the devlist
2337 		 * (which indicates active communication between
2338 		 * the host port and the port in the changelist).
2339 		 * If however we are in a private loop or point to
2340 		 * point mode, we need to check for any IP capable
2341 		 * ports and update our routing table.
2342 		 */
2343 		switch (port_top) {
2344 		case FC_TOP_FABRIC:
2345 			/*
2346 			 * This indicates a fabric port with a NameServer.
2347 			 * Check the devlist to see if we are in active
2348 			 * communication with a port on the devlist.
2349 			 */
2350 			FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_NOTE,
2351 			    "Statec_cb: fabric topology"));
2352 			fcip_rt_update(fptr, changelist, listlen);
2353 			break;
2354 		case FC_TOP_NO_NS:
2355 			/*
2356 			 * No nameserver - so treat it like a Private loop
2357 			 * or point to point topology and get a map of
2358 			 * devices on the link and get IP capable ports to
2359 			 * to update the routing table.
2360 			 */
2361 			FCIP_DEBUG(FCIP_DEBUG_ELS,
2362 			    (CE_NOTE, "Statec_cb: NO_NS topology"));
2363 		/* FALLTHROUGH */
2364 		case FC_TOP_PRIVATE_LOOP:
2365 			FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_NOTE,
2366 			    "Statec_cb: Pvt_Loop topology"));
2367 		/* FALLTHROUGH */
2368 		case FC_TOP_PT_PT:
2369 			/*
2370 			 * call get_port_map() and update routing table
2371 			 */
2372 			fcip_rt_update(fptr, changelist, listlen);
2373 			break;
2374 		default:
2375 			FCIP_DEBUG(FCIP_DEBUG_ELS,
2376 			    (CE_NOTE, "Statec_cb: Unknown topology"));
2377 		}
2378 
2379 		/*
2380 		 * We should now enable the Queues and permit I/Os
2381 		 * to flow through downstream. The update of routing
2382 		 * table should have flushed out any port entries that
2383 		 * don't exist or are not available after the state change
2384 		 */
2385 		mutex_enter(&fptr->fcip_mutex);
2386 		fptr->fcip_port_state = FCIP_PORT_ONLINE;
2387 		if (fptr->fcip_flags & FCIP_LINK_DOWN) {
2388 			fptr->fcip_flags &= ~FCIP_LINK_DOWN;
2389 		}
2390 		mutex_exit(&fptr->fcip_mutex);
2391 
2392 		/*
2393 		 * Enable write queues
2394 		 */
2395 		rw_enter(&fcipstruplock, RW_READER);
2396 		for (slp = fcipstrup; slp != NULL; slp = slp->sl_nextp) {
2397 			if (slp && slp->sl_fcip == fptr) {
2398 				wrq = WR(slp->sl_rq);
2399 				if (wrq->q_flag & QFULL) {
2400 					qenable(wrq);
2401 				}
2402 			}
2403 		}
2404 		rw_exit(&fcipstruplock);
2405 		break;
2406 	case FC_STATE_OFFLINE:
2407 		/*
2408 		 * mark the port_state OFFLINE and wait for it to
2409 		 * become online. Any new messages in this state will
2410 		 * simply be queued back up. If the port does not
2411 		 * come online in a short while, we can begin failing
2412 		 * messages and flush the routing table
2413 		 */
2414 		mutex_enter(&fptr->fcip_mutex);
2415 		fptr->fcip_mark_offline = fptr->fcip_timeout_ticks +
2416 		    FCIP_OFFLINE_TIMEOUT;
2417 		fptr->fcip_port_state = FCIP_PORT_OFFLINE;
2418 		mutex_exit(&fptr->fcip_mutex);
2419 
2420 		/*
2421 		 * Mark all Routing table entries as invalid to prevent
2422 		 * any commands from trickling through to ports that
2423 		 * have disappeared from under us
2424 		 */
2425 		mutex_enter(&fptr->fcip_rt_mutex);
2426 		for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
2427 			frtp = fptr->fcip_rtable[index];
2428 			while (frtp) {
2429 				frtp->fcipr_state = PORT_DEVICE_INVALID;
2430 				frtp = frtp->fcipr_next;
2431 			}
2432 		}
2433 		mutex_exit(&fptr->fcip_rt_mutex);
2434 
2435 		break;
2436 
2437 	case FC_STATE_RESET_REQUESTED:
2438 		/*
2439 		 * Release all Unsolicited buffers back to transport/FCA.
2440 		 * This also means the port state is marked offline - so
2441 		 * we may have to do what OFFLINE state requires us to do.
2442 		 * Care must be taken to wait for any active unsolicited
2443 		 * buffer with the other Streams modules - so wait for
2444 		 * a freeb if the unsolicited buffer is passed back all
2445 		 * the way upstream.
2446 		 */
2447 		mutex_enter(&fptr->fcip_mutex);
2448 
2449 #ifdef FCIP_ESBALLOC
2450 		while (fptr->fcip_ub_upstream) {
2451 			cv_wait(&fptr->fcip_ub_cv, &fptr->fcip_mutex);
2452 		}
2453 #endif	/* FCIP_ESBALLOC */
2454 
2455 		fptr->fcip_mark_offline = fptr->fcip_timeout_ticks +
2456 		    FCIP_OFFLINE_TIMEOUT;
2457 		fptr->fcip_port_state = FCIP_PORT_OFFLINE;
2458 		mutex_exit(&fptr->fcip_mutex);
2459 		break;
2460 
2461 	case FC_STATE_DEVICE_CHANGE:
2462 		if (listlen) {
2463 			fcip_rt_update(fptr, changelist, listlen);
2464 		}
2465 		break;
2466 	case FC_STATE_RESET:
2467 		/*
2468 		 * Not much to do I guess - wait for port to become
2469 		 * ONLINE. If the port doesn't become online in a short
2470 		 * while, the upper layers abort any request themselves.
2471 		 * We can just putback the messages in the streams queues
2472 		 * if the link is offline
2473 		 */
2474 		break;
2475 	}
2476 	mutex_enter(&fptr->fcip_mutex);
2477 	fptr->fcip_flags &= ~(FCIP_IN_SC_CB);
2478 	mutex_exit(&fptr->fcip_mutex);
2479 }
2480 
2481 /*
2482  * Given a port handle, return the fcip_port_info structure corresponding
2483  * to that port handle. The transport allocates and communicates with
2484  * ULPs using port handles
2485  */
2486 static fcip_port_info_t *
2487 fcip_get_port(opaque_t phandle)
2488 {
2489 	fcip_port_info_t *fport;
2490 
2491 	ASSERT(phandle != NULL);
2492 
2493 	mutex_enter(&fcip_global_mutex);
2494 	fport = fcip_port_head;
2495 
2496 	while (fport != NULL) {
2497 		if (fport->fcipp_handle == phandle) {
2498 			/* found */
2499 			break;
2500 		}
2501 		fport = fport->fcipp_next;
2502 	}
2503 
2504 	mutex_exit(&fcip_global_mutex);
2505 
2506 	return (fport);
2507 }
2508 
2509 /*
2510  * Handle inbound ELS requests received by the transport. We are only
2511  * intereseted in FARP/InARP mostly.
2512  */
2513 /* ARGSUSED */
2514 static int
2515 fcip_els_cb(opaque_t ulp_handle, opaque_t phandle,
2516     fc_unsol_buf_t *buf, uint32_t claimed)
2517 {
2518 	fcip_port_info_t	*fport;
2519 	struct fcip 		*fptr;
2520 	int			instance;
2521 	uchar_t			r_ctl;
2522 	uchar_t			ls_code;
2523 	la_els_farp_t		farp_cmd;
2524 	la_els_farp_t		*fcmd;
2525 	int			rval = FC_UNCLAIMED;
2526 
2527 	fport = fcip_get_port(phandle);
2528 	if (fport == NULL) {
2529 		return (FC_UNCLAIMED);
2530 	}
2531 
2532 	fptr = fport->fcipp_fcip;
2533 	ASSERT(fptr != NULL);
2534 	if (fptr == NULL) {
2535 		return (FC_UNCLAIMED);
2536 	}
2537 
2538 	instance = ddi_get_instance(fport->fcipp_dip);
2539 
2540 	mutex_enter(&fptr->fcip_mutex);
2541 	if ((fptr->fcip_flags & (FCIP_DETACHING | FCIP_DETACHED)) ||
2542 	    (fptr->fcip_flags & (FCIP_SUSPENDED | FCIP_POWER_DOWN))) {
2543 		mutex_exit(&fptr->fcip_mutex);
2544 		return (FC_UNCLAIMED);
2545 	}
2546 
2547 	/*
2548 	 * set fcip flags to indicate we are in the middle of a
2549 	 * ELS callback so we can wait till the statechange
2550 	 * is handled before succeeding/failing the SUSPEND/POWER DOWN.
2551 	 */
2552 	fptr->fcip_flags |= FCIP_IN_ELS_CB;
2553 	mutex_exit(&fptr->fcip_mutex);
2554 
2555 	FCIP_TNF_PROBE_2((fcip_els_cb, "fcip io", /* CSTYLED */,
2556 		tnf_string, msg, "ELS callback",
2557 		tnf_uint, instance, instance));
2558 
2559 	FCIP_DEBUG(FCIP_DEBUG_ELS,
2560 	    (CE_NOTE, "fcip%d, ELS callback , ", instance));
2561 
2562 	r_ctl = buf->ub_frame.r_ctl;
2563 	switch (r_ctl & R_CTL_ROUTING) {
2564 	case R_CTL_EXTENDED_SVC:
2565 		if (r_ctl == R_CTL_ELS_REQ) {
2566 			ls_code = buf->ub_buffer[0];
2567 			if (ls_code == LA_ELS_FARP_REQ) {
2568 				/*
2569 				 * Inbound FARP broadcast request
2570 				 */
2571 				if (buf->ub_bufsize != sizeof (la_els_farp_t)) {
2572 					FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_WARN,
2573 					    "Invalid FARP req buffer size "
2574 					    "expected 0x%lx, got 0x%x",
2575 					    (long)(sizeof (la_els_farp_t)),
2576 					    buf->ub_bufsize));
2577 					rval = FC_UNCLAIMED;
2578 					goto els_cb_done;
2579 				}
2580 				fcmd = (la_els_farp_t *)buf;
2581 				if (fcip_wwn_compare(&fcmd->resp_nwwn,
2582 				    &fport->fcipp_nwwn,
2583 				    FCIP_COMPARE_NWWN) != 0) {
2584 					rval = FC_UNCLAIMED;
2585 					goto els_cb_done;
2586 				}
2587 				/*
2588 				 * copy the FARP request and release the
2589 				 * unsolicited buffer
2590 				 */
2591 				fcmd = &farp_cmd;
2592 				bcopy((void *)buf, (void *)fcmd,
2593 				    sizeof (la_els_farp_t));
2594 				(void) fc_ulp_ubrelease(fport->fcipp_handle, 1,
2595 				    &buf->ub_token);
2596 
2597 				if (fcip_farp_supported &&
2598 				    fcip_handle_farp_request(fptr, fcmd) ==
2599 				    FC_SUCCESS) {
2600 					/*
2601 					 * We successfully sent out a FARP
2602 					 * reply to the requesting port
2603 					 */
2604 					rval = FC_SUCCESS;
2605 					goto els_cb_done;
2606 				} else {
2607 					rval = FC_UNCLAIMED;
2608 					goto els_cb_done;
2609 				}
2610 			}
2611 		} else if (r_ctl == R_CTL_ELS_RSP) {
2612 			ls_code = buf->ub_buffer[0];
2613 			if (ls_code == LA_ELS_FARP_REPLY) {
2614 				/*
2615 				 * We received a REPLY to our FARP request
2616 				 */
2617 				if (buf->ub_bufsize != sizeof (la_els_farp_t)) {
2618 					FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_WARN,
2619 					    "Invalid FARP req buffer size "
2620 					    "expected 0x%lx, got 0x%x",
2621 					    (long)(sizeof (la_els_farp_t)),
2622 					    buf->ub_bufsize));
2623 					rval = FC_UNCLAIMED;
2624 					goto els_cb_done;
2625 				}
2626 				fcmd = &farp_cmd;
2627 				bcopy((void *)buf, (void *)fcmd,
2628 				    sizeof (la_els_farp_t));
2629 				(void) fc_ulp_ubrelease(fport->fcipp_handle, 1,
2630 				    &buf->ub_token);
2631 				if (fcip_farp_supported &&
2632 				    fcip_handle_farp_response(fptr, fcmd) ==
2633 				    FC_SUCCESS) {
2634 					FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_NOTE,
2635 					    "Successfully recevied a FARP "
2636 					    "response"));
2637 					mutex_enter(&fptr->fcip_mutex);
2638 					fptr->fcip_farp_rsp_flag = 1;
2639 					cv_signal(&fptr->fcip_farp_cv);
2640 					mutex_exit(&fptr->fcip_mutex);
2641 					rval = FC_SUCCESS;
2642 					goto els_cb_done;
2643 				} else {
2644 					FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_WARN,
2645 					    "Unable to handle a FARP response "
2646 					    "receive"));
2647 					rval = FC_UNCLAIMED;
2648 					goto els_cb_done;
2649 				}
2650 			}
2651 		}
2652 		break;
2653 	default:
2654 		break;
2655 	}
2656 els_cb_done:
2657 	mutex_enter(&fptr->fcip_mutex);
2658 	fptr->fcip_flags &= ~(FCIP_IN_ELS_CB);
2659 	mutex_exit(&fptr->fcip_mutex);
2660 	return (rval);
2661 }
2662 
2663 
2664 /*
2665  * Handle inbound FARP requests
2666  */
2667 static int
2668 fcip_handle_farp_request(struct fcip *fptr, la_els_farp_t *fcmd)
2669 {
2670 	fcip_pkt_t		*fcip_pkt;
2671 	fc_packet_t		*fc_pkt;
2672 	fcip_port_info_t	*fport = fptr->fcip_port_info;
2673 	int			rval = FC_FAILURE;
2674 	opaque_t		fca_dev;
2675 	fc_portmap_t 		map;
2676 	struct fcip_routing_table *frp;
2677 	struct fcip_dest *fdestp;
2678 
2679 	/*
2680 	 * Add an entry for the remote port into our routing and destination
2681 	 * tables.
2682 	 */
2683 	map.map_did = fcmd->req_id;
2684 	map.map_hard_addr.hard_addr = fcmd->req_id.port_id;
2685 	map.map_state = PORT_DEVICE_VALID;
2686 	map.map_type = PORT_DEVICE_NEW;
2687 	map.map_flags = 0;
2688 	map.map_pd = NULL;
2689 	bcopy((void *)&fcmd->req_pwwn, (void *)&map.map_pwwn,
2690 	    sizeof (la_wwn_t));
2691 	bcopy((void *)&fcmd->req_nwwn, (void *)&map.map_nwwn,
2692 	    sizeof (la_wwn_t));
2693 	fcip_rt_update(fptr, &map, 1);
2694 	mutex_enter(&fptr->fcip_rt_mutex);
2695 	frp = fcip_lookup_rtable(fptr, &fcmd->req_pwwn, FCIP_COMPARE_NWWN);
2696 	mutex_exit(&fptr->fcip_rt_mutex);
2697 
2698 	fdestp = fcip_add_dest(fptr, frp);
2699 
2700 	fcip_pkt = fcip_ipkt_alloc(fptr, sizeof (la_els_farp_t),
2701 	    sizeof (la_els_farp_t), NULL, KM_SLEEP);
2702 	if (fcip_pkt == NULL) {
2703 		rval = FC_FAILURE;
2704 		goto farp_done;
2705 	}
2706 	/*
2707 	 * Fill in our port's PWWN and NWWN
2708 	 */
2709 	fcmd->resp_pwwn = fport->fcipp_pwwn;
2710 	fcmd->resp_nwwn = fport->fcipp_nwwn;
2711 
2712 	fcip_init_unicast_pkt(fcip_pkt, fport->fcipp_sid,
2713 	    fcmd->req_id, NULL);
2714 
2715 	fca_dev =
2716 	    fc_ulp_get_fca_device(fport->fcipp_handle, fcmd->req_id);
2717 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
2718 	fc_pkt->pkt_cmd_fhdr.r_ctl = R_CTL_ELS_RSP;
2719 	fc_pkt->pkt_fca_device = fca_dev;
2720 	fcip_pkt->fcip_pkt_dest = fdestp;
2721 
2722 	/*
2723 	 * Attempt a PLOGI again
2724 	 */
2725 	if (fcmd->resp_flags & FARP_INIT_P_LOGI) {
2726 		if (fcip_do_plogi(fptr, frp) != FC_SUCCESS) {
2727 			/*
2728 			 * Login to the remote port failed. There is no
2729 			 * point continuing with the FARP request further
2730 			 * so bail out here.
2731 			 */
2732 			frp->fcipr_state = PORT_DEVICE_INVALID;
2733 			rval = FC_FAILURE;
2734 			goto farp_done;
2735 		}
2736 	}
2737 
2738 	FCIP_CP_OUT(fcmd, fc_pkt->pkt_cmd, fc_pkt->pkt_cmd_acc,
2739 	    sizeof (la_els_farp_t));
2740 
2741 	rval = fc_ulp_issue_els(fport->fcipp_handle, fc_pkt);
2742 	if (rval != FC_SUCCESS) {
2743 		FCIP_TNF_PROBE_2((fcip_handle_farp_request, "fcip io",
2744 		    /* CSTYLED */, tnf_string, msg,
2745 		    "fcip_transport of farp reply failed",
2746 		    tnf_uint, rval, rval));
2747 		FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_WARN,
2748 		    "fcip_transport of farp reply failed 0x%x", rval));
2749 	}
2750 
2751 farp_done:
2752 	return (rval);
2753 }
2754 
2755 
2756 /*
2757  * Handle FARP responses to our FARP requests. When we receive a FARP
2758  * reply, we need to add the entry for the Port that replied into our
2759  * routing and destination hash tables. It is possible that the remote
2760  * port did not login into us (FARP responses can be received without
2761  * a PLOGI)
2762  */
2763 static int
2764 fcip_handle_farp_response(struct fcip *fptr, la_els_farp_t *fcmd)
2765 {
2766 	int			rval = FC_FAILURE;
2767 	fc_portmap_t 		map;
2768 	struct fcip_routing_table *frp;
2769 	struct fcip_dest *fdestp;
2770 
2771 	/*
2772 	 * Add an entry for the remote port into our routing and destination
2773 	 * tables.
2774 	 */
2775 	map.map_did = fcmd->dest_id;
2776 	map.map_hard_addr.hard_addr = fcmd->dest_id.port_id;
2777 	map.map_state = PORT_DEVICE_VALID;
2778 	map.map_type = PORT_DEVICE_NEW;
2779 	map.map_flags = 0;
2780 	map.map_pd = NULL;
2781 	bcopy((void *)&fcmd->resp_pwwn, (void *)&map.map_pwwn,
2782 	    sizeof (la_wwn_t));
2783 	bcopy((void *)&fcmd->resp_nwwn, (void *)&map.map_nwwn,
2784 	    sizeof (la_wwn_t));
2785 	fcip_rt_update(fptr, &map, 1);
2786 	mutex_enter(&fptr->fcip_rt_mutex);
2787 	frp = fcip_lookup_rtable(fptr, &fcmd->resp_pwwn, FCIP_COMPARE_NWWN);
2788 	mutex_exit(&fptr->fcip_rt_mutex);
2789 
2790 	fdestp = fcip_add_dest(fptr, frp);
2791 
2792 	if (fdestp != NULL) {
2793 		rval = FC_SUCCESS;
2794 	}
2795 	return (rval);
2796 }
2797 
2798 
2799 #define	FCIP_HDRS_LENGTH	\
2800 	sizeof (fcph_network_hdr_t)+sizeof (llc_snap_hdr_t)+sizeof (ipha_t)
2801 
2802 /*
2803  * fcip_data_cb is the heart of most IP operations. This routine is called
2804  * by the transport when any unsolicited IP data arrives at a port (which
2805  * is almost all IP data). This routine then strips off the Network header
2806  * from the payload (after authenticating the received payload ofcourse),
2807  * creates a message blk and sends the data upstream. You will see ugly
2808  * #defines because of problems with using esballoc() as opposed to
2809  * allocb to prevent an extra copy of data. We should probably move to
2810  * esballoc entirely when the MTU eventually will be larger than 1500 bytes
2811  * since copies will get more expensive then. At 1500 byte MTUs, there is
2812  * no noticable difference between using allocb and esballoc. The other
2813  * caveat is that the qlc firmware still cannot tell us accurately the
2814  * no. of valid bytes in the unsol buffer it DMA'ed so we have to resort
2815  * to looking into the IP header and hoping that the no. of bytes speficified
2816  * in the header was actually received.
2817  */
2818 /* ARGSUSED */
2819 static int
2820 fcip_data_cb(opaque_t ulp_handle, opaque_t phandle,
2821     fc_unsol_buf_t *buf, uint32_t claimed)
2822 {
2823 	fcip_port_info_t		*fport;
2824 	struct fcip 			*fptr;
2825 	fcph_network_hdr_t		*nhdr;
2826 	llc_snap_hdr_t			*snaphdr;
2827 	mblk_t				*bp;
2828 	uint32_t 			len;
2829 	uint32_t			hdrlen;
2830 	ushort_t			type;
2831 	ipha_t				*iphdr;
2832 	int				rval;
2833 
2834 #ifdef FCIP_ESBALLOC
2835 	frtn_t				*free_ubuf;
2836 	struct fcip_esballoc_arg	*fesb_argp;
2837 #endif /* FCIP_ESBALLOC */
2838 
2839 	fport = fcip_get_port(phandle);
2840 	if (fport == NULL) {
2841 		return (FC_UNCLAIMED);
2842 	}
2843 
2844 	fptr = fport->fcipp_fcip;
2845 	ASSERT(fptr != NULL);
2846 
2847 	if (fptr == NULL) {
2848 		return (FC_UNCLAIMED);
2849 	}
2850 
2851 	mutex_enter(&fptr->fcip_mutex);
2852 	if ((fptr->fcip_flags & (FCIP_DETACHING | FCIP_DETACHED)) ||
2853 	    (fptr->fcip_flags & (FCIP_SUSPENDED | FCIP_POWER_DOWN))) {
2854 		mutex_exit(&fptr->fcip_mutex);
2855 		rval = FC_UNCLAIMED;
2856 		goto data_cb_done;
2857 	}
2858 
2859 	/*
2860 	 * set fcip flags to indicate we are in the middle of a
2861 	 * data callback so we can wait till the statechange
2862 	 * is handled before succeeding/failing the SUSPEND/POWER DOWN.
2863 	 */
2864 	fptr->fcip_flags |= FCIP_IN_DATA_CB;
2865 	mutex_exit(&fptr->fcip_mutex);
2866 
2867 	FCIP_TNF_PROBE_2((fcip_data_cb, "fcip io", /* CSTYLED */,
2868 		tnf_string, msg, "data callback",
2869 		tnf_int, instance, ddi_get_instance(fport->fcipp_dip)));
2870 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2871 	    (CE_NOTE, "fcip%d, data callback",
2872 	    ddi_get_instance(fport->fcipp_dip)));
2873 
2874 	/*
2875 	 * get to the network and snap headers in the payload
2876 	 */
2877 	nhdr = (fcph_network_hdr_t *)buf->ub_buffer;
2878 	snaphdr = (llc_snap_hdr_t *)(buf->ub_buffer +
2879 	    sizeof (fcph_network_hdr_t));
2880 
2881 	hdrlen = sizeof (fcph_network_hdr_t) + sizeof (llc_snap_hdr_t);
2882 
2883 	/*
2884 	 * get the IP header to obtain the no. of bytes we need to read
2885 	 * off from the unsol buffer. This obviously is because not all
2886 	 * data fills up the unsol buffer completely and the firmware
2887 	 * doesn't tell us how many valid bytes are in there as well
2888 	 */
2889 	iphdr = (ipha_t *)(buf->ub_buffer + hdrlen);
2890 	snaphdr->pid = BE_16(snaphdr->pid);
2891 	type = snaphdr->pid;
2892 
2893 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2894 	    (CE_CONT, "SNAPHDR: dsap %x, ssap %x, ctrl %x\n",
2895 	    snaphdr->dsap, snaphdr->ssap, snaphdr->ctrl));
2896 
2897 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2898 	    (CE_CONT, "oui[0] 0x%x oui[1] 0x%x oui[2] 0x%x pid 0x%x\n",
2899 	    snaphdr->oui[0], snaphdr->oui[1], snaphdr->oui[2], snaphdr->pid));
2900 
2901 	/* Authneticate, Authenticate */
2902 	if (type == ETHERTYPE_IP) {
2903 		len = hdrlen + BE_16(iphdr->ipha_length);
2904 	} else if (type == ETHERTYPE_ARP) {
2905 		len = hdrlen + 28;
2906 	} else {
2907 		len = buf->ub_bufsize;
2908 	}
2909 
2910 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2911 	    (CE_CONT, "effective packet length is %d bytes.\n", len));
2912 
2913 	if (len < hdrlen || len > FCIP_UB_SIZE) {
2914 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2915 		    (CE_NOTE, "Incorrect buffer size %d bytes", len));
2916 		rval = FC_UNCLAIMED;
2917 		goto data_cb_done;
2918 	}
2919 
2920 	if (buf->ub_frame.type != FC_TYPE_IS8802_SNAP) {
2921 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM, (CE_NOTE, "Not IP/ARP data"));
2922 		rval = FC_UNCLAIMED;
2923 		goto data_cb_done;
2924 	}
2925 
2926 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM, (CE_NOTE, "checking wwn"));
2927 
2928 	if ((fcip_wwn_compare(&nhdr->net_dest_addr, &fport->fcipp_pwwn,
2929 	    FCIP_COMPARE_NWWN) != 0) &&
2930 	    (!IS_BROADCAST_ADDR(&nhdr->net_dest_addr))) {
2931 		rval = FC_UNCLAIMED;
2932 		goto data_cb_done;
2933 	} else if (fcip_cache_on_arp_broadcast &&
2934 	    IS_BROADCAST_ADDR(&nhdr->net_dest_addr)) {
2935 		fcip_cache_arp_broadcast(fptr, buf);
2936 	}
2937 
2938 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM, (CE_NOTE, "Allocate streams block"));
2939 
2940 	/*
2941 	 * Using esballoc instead of allocb should be faster, atleast at
2942 	 * larger MTUs than 1500 bytes. Someday we'll get there :)
2943 	 */
2944 #if defined(FCIP_ESBALLOC)
2945 	/*
2946 	 * allocate memory for the frtn function arg. The Function
2947 	 * (fcip_ubfree) arg is a struct fcip_esballoc_arg type
2948 	 * which contains pointers to the unsol buffer and the
2949 	 * opaque port handle for releasing the unsol buffer back to
2950 	 * the FCA for reuse
2951 	 */
2952 	fesb_argp = (struct fcip_esballoc_arg *)
2953 	    kmem_zalloc(sizeof (struct fcip_esballoc_arg), KM_NOSLEEP);
2954 
2955 	if (fesb_argp == NULL) {
2956 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2957 		    (CE_WARN, "esballoc of mblk failed in data_cb"));
2958 		rval = FC_UNCLAIMED;
2959 		goto data_cb_done;
2960 	}
2961 	/*
2962 	 * Check with KM_NOSLEEP
2963 	 */
2964 	free_ubuf = (frtn_t *)kmem_zalloc(sizeof (frtn_t), KM_NOSLEEP);
2965 	if (free_ubuf == NULL) {
2966 		kmem_free(fesb_argp, sizeof (struct fcip_esballoc_arg));
2967 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2968 		    (CE_WARN, "esballoc of mblk failed in data_cb"));
2969 		rval = FC_UNCLAIMED;
2970 		goto data_cb_done;
2971 	}
2972 
2973 	fesb_argp->frtnp = free_ubuf;
2974 	fesb_argp->buf = buf;
2975 	fesb_argp->phandle = phandle;
2976 	free_ubuf->free_func = fcip_ubfree;
2977 	free_ubuf->free_arg = (char *)fesb_argp;
2978 	if ((bp = (mblk_t *)esballoc((unsigned char *)buf->ub_buffer,
2979 	    len, BPRI_MED, free_ubuf)) == NULL) {
2980 		kmem_free(fesb_argp, sizeof (struct fcip_esballoc_arg));
2981 		kmem_free(free_ubuf, sizeof (frtn_t));
2982 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2983 		    (CE_WARN, "esballoc of mblk failed in data_cb"));
2984 		rval = FC_UNCLAIMED;
2985 		goto data_cb_done;
2986 	}
2987 #elif !defined(FCIP_ESBALLOC)
2988 	/*
2989 	 * allocate streams mblk and copy the contents of the
2990 	 * unsolicited buffer into this newly alloc'ed mblk
2991 	 */
2992 	if ((bp = (mblk_t *)fcip_allocb((size_t)len, BPRI_LO)) == NULL) {
2993 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
2994 		    (CE_WARN, "alloc of mblk failed in data_cb"));
2995 		rval = FC_UNCLAIMED;
2996 		goto data_cb_done;
2997 	}
2998 
2999 	/*
3000 	 * Unsolicited buffers handed up to us from the FCA must be
3001 	 * endian clean so just bcopy the data into our mblk. Else
3002 	 * we may have to either copy the data byte by byte or
3003 	 * use the ddi_rep_get* routines to do the copy for us.
3004 	 */
3005 	bcopy(buf->ub_buffer, bp->b_rptr, len);
3006 
3007 	/*
3008 	 * for esballoc'ed mblks - free the UB in the frtn function
3009 	 * along with the memory allocated for the function arg.
3010 	 * for allocb'ed mblk - release the unsolicited buffer here
3011 	 */
3012 	(void) fc_ulp_ubrelease(phandle, 1, &buf->ub_token);
3013 
3014 #endif	/* FCIP_ESBALLOC */
3015 
3016 	bp->b_wptr = bp->b_rptr + len;
3017 	fptr->fcip_ipackets++;
3018 
3019 	if (type == ETHERTYPE_IP) {
3020 		mutex_enter(&fptr->fcip_mutex);
3021 		fptr->fcip_ub_upstream++;
3022 		mutex_exit(&fptr->fcip_mutex);
3023 		bp->b_rptr += hdrlen;
3024 
3025 		/*
3026 		 * Check if ipq is valid in the sendup thread
3027 		 */
3028 		if (fcip_sendup_alloc_enque(fptr, bp, NULL) != FC_SUCCESS) {
3029 			freemsg(bp);
3030 		}
3031 	} else {
3032 		/*
3033 		 * We won't get ethernet 802.3 packets in FCIP but we may get
3034 		 * types other than ETHERTYPE_IP, such as ETHERTYPE_ARP. Let
3035 		 * fcip_sendup() do the matching.
3036 		 */
3037 		mutex_enter(&fptr->fcip_mutex);
3038 		fptr->fcip_ub_upstream++;
3039 		mutex_exit(&fptr->fcip_mutex);
3040 		if (fcip_sendup_alloc_enque(fptr, bp,
3041 		    fcip_accept) != FC_SUCCESS) {
3042 			freemsg(bp);
3043 		}
3044 	}
3045 
3046 	rval = FC_SUCCESS;
3047 
3048 	/*
3049 	 * Unset fcip_flags to indicate we are out of callback and return
3050 	 */
3051 data_cb_done:
3052 	mutex_enter(&fptr->fcip_mutex);
3053 	fptr->fcip_flags &= ~(FCIP_IN_DATA_CB);
3054 	mutex_exit(&fptr->fcip_mutex);
3055 	return (rval);
3056 }
3057 
3058 #if !defined(FCIP_ESBALLOC)
3059 /*
3060  * Allocate a message block for the inbound data to be sent upstream.
3061  */
3062 static void *
3063 fcip_allocb(size_t size, uint_t pri)
3064 {
3065 	mblk_t	*mp;
3066 
3067 	if ((mp = allocb(size, pri)) == NULL) {
3068 		return (NULL);
3069 	}
3070 	return (mp);
3071 }
3072 
3073 #endif
3074 
3075 /*
3076  * This helper routine kmem cache alloc's a sendup element for enquing
3077  * into the sendup list for callbacks upstream from the dedicated sendup
3078  * thread. We enque the msg buf into the sendup list and cv_signal the
3079  * sendup thread to finish the callback for us.
3080  */
3081 static int
3082 fcip_sendup_alloc_enque(struct fcip *fptr, mblk_t *mp, struct fcipstr *(*f)())
3083 {
3084 	struct fcip_sendup_elem 	*msg_elem;
3085 	int				rval = FC_FAILURE;
3086 
3087 	FCIP_TNF_PROBE_1((fcip_sendup_alloc_enque, "fcip io", /* CSTYLED */,
3088 		tnf_string, msg, "sendup msg enque"));
3089 	msg_elem = kmem_cache_alloc(fptr->fcip_sendup_cache, KM_NOSLEEP);
3090 	if (msg_elem == NULL) {
3091 		/* drop pkt to floor - update stats */
3092 		rval = FC_FAILURE;
3093 		goto sendup_alloc_done;
3094 	}
3095 	msg_elem->fcipsu_mp = mp;
3096 	msg_elem->fcipsu_func = f;
3097 
3098 	mutex_enter(&fptr->fcip_sendup_mutex);
3099 	if (fptr->fcip_sendup_head == NULL) {
3100 		fptr->fcip_sendup_head = fptr->fcip_sendup_tail = msg_elem;
3101 	} else {
3102 		fptr->fcip_sendup_tail->fcipsu_next = msg_elem;
3103 		fptr->fcip_sendup_tail = msg_elem;
3104 	}
3105 	fptr->fcip_sendup_cnt++;
3106 	cv_signal(&fptr->fcip_sendup_cv);
3107 	mutex_exit(&fptr->fcip_sendup_mutex);
3108 	rval = FC_SUCCESS;
3109 
3110 sendup_alloc_done:
3111 	return (rval);
3112 }
3113 
3114 /*
3115  * One of the ways of performing the WWN to D_ID mapping required for
3116  * IPFC data is to cache the unsolicited ARP broadcast messages received
3117  * and update the routing table to add entry for the destination port
3118  * if we are the intended recipient of the ARP broadcast message. This is
3119  * one of the methods recommended in the rfc to obtain the WWN to D_ID mapping
3120  * but is not typically used unless enabled. The driver prefers to use the
3121  * nameserver/lilp map to obtain this mapping.
3122  */
3123 static void
3124 fcip_cache_arp_broadcast(struct fcip *fptr, fc_unsol_buf_t *buf)
3125 {
3126 	fcip_port_info_t		*fport;
3127 	fcph_network_hdr_t		*nhdr;
3128 	struct fcip_routing_table	*frp;
3129 	fc_portmap_t			map;
3130 
3131 	fport = fptr->fcip_port_info;
3132 	if (fport == NULL) {
3133 		return;
3134 	}
3135 	ASSERT(fport != NULL);
3136 
3137 	nhdr = (fcph_network_hdr_t *)buf->ub_buffer;
3138 
3139 	mutex_enter(&fptr->fcip_rt_mutex);
3140 	frp = fcip_lookup_rtable(fptr, &nhdr->net_src_addr, FCIP_COMPARE_NWWN);
3141 	mutex_exit(&fptr->fcip_rt_mutex);
3142 	if (frp == NULL) {
3143 		map.map_did.port_id = buf->ub_frame.s_id;
3144 		map.map_hard_addr.hard_addr = buf->ub_frame.s_id;
3145 		map.map_state = PORT_DEVICE_VALID;
3146 		map.map_type = PORT_DEVICE_NEW;
3147 		map.map_flags = 0;
3148 		map.map_pd = NULL;
3149 		bcopy((void *)&nhdr->net_src_addr, (void *)&map.map_pwwn,
3150 		    sizeof (la_wwn_t));
3151 		bcopy((void *)&nhdr->net_src_addr, (void *)&map.map_nwwn,
3152 		    sizeof (la_wwn_t));
3153 		fcip_rt_update(fptr, &map, 1);
3154 		mutex_enter(&fptr->fcip_rt_mutex);
3155 		frp = fcip_lookup_rtable(fptr, &nhdr->net_src_addr,
3156 		    FCIP_COMPARE_NWWN);
3157 		mutex_exit(&fptr->fcip_rt_mutex);
3158 
3159 		(void) fcip_add_dest(fptr, frp);
3160 	}
3161 
3162 }
3163 
3164 /*
3165  * This is a dedicated thread to do callbacks from fcip's data callback
3166  * routines into the modules upstream. The reason for this thread is
3167  * the data callback function can be called from an interrupt context and
3168  * the upstream modules *can* make calls downstream in the same thread
3169  * context. If the call is to a fabric port which is not yet in our
3170  * routing tables, we may have to query the nameserver/fabric for the
3171  * MAC addr to Port_ID mapping which may be blocking calls.
3172  */
3173 static void
3174 fcip_sendup_thr(void *arg)
3175 {
3176 	struct fcip		*fptr = (struct fcip *)arg;
3177 	struct fcip_sendup_elem	*msg_elem;
3178 	queue_t			*ip4q = NULL;
3179 
3180 	CALLB_CPR_INIT(&fptr->fcip_cpr_info, &fptr->fcip_sendup_mutex,
3181 	    callb_generic_cpr, "fcip_sendup_thr");
3182 
3183 	mutex_enter(&fptr->fcip_sendup_mutex);
3184 	for (;;) {
3185 
3186 		while (fptr->fcip_sendup_thr_initted &&
3187 		    fptr->fcip_sendup_head == NULL) {
3188 			CALLB_CPR_SAFE_BEGIN(&fptr->fcip_cpr_info);
3189 			cv_wait(&fptr->fcip_sendup_cv,
3190 			    &fptr->fcip_sendup_mutex);
3191 			CALLB_CPR_SAFE_END(&fptr->fcip_cpr_info,
3192 			    &fptr->fcip_sendup_mutex);
3193 		}
3194 
3195 		if (fptr->fcip_sendup_thr_initted == 0) {
3196 			break;
3197 		}
3198 
3199 		FCIP_TNF_PROBE_1((fcip_sendup_thr, "fcip io", /* CSTYLED */,
3200 		    tnf_string, msg, "fcip sendup thr - new msg"));
3201 
3202 		msg_elem = fptr->fcip_sendup_head;
3203 		fptr->fcip_sendup_head = msg_elem->fcipsu_next;
3204 		msg_elem->fcipsu_next = NULL;
3205 		mutex_exit(&fptr->fcip_sendup_mutex);
3206 
3207 		if (msg_elem->fcipsu_func == NULL) {
3208 			/*
3209 			 * Message for ipq. Check to see if the ipq is
3210 			 * is still valid. Since the thread is asynchronous,
3211 			 * there could have been a close on the stream
3212 			 */
3213 			mutex_enter(&fptr->fcip_mutex);
3214 			if (fptr->fcip_ipq && canputnext(fptr->fcip_ipq)) {
3215 				ip4q = fptr->fcip_ipq;
3216 				mutex_exit(&fptr->fcip_mutex);
3217 				putnext(ip4q, msg_elem->fcipsu_mp);
3218 			} else {
3219 				mutex_exit(&fptr->fcip_mutex);
3220 				freemsg(msg_elem->fcipsu_mp);
3221 			}
3222 		} else {
3223 			fcip_sendup(fptr, msg_elem->fcipsu_mp,
3224 			    msg_elem->fcipsu_func);
3225 		}
3226 
3227 #if !defined(FCIP_ESBALLOC)
3228 		/*
3229 		 * for allocb'ed mblk - decrement upstream count here
3230 		 */
3231 		mutex_enter(&fptr->fcip_mutex);
3232 		ASSERT(fptr->fcip_ub_upstream > 0);
3233 		fptr->fcip_ub_upstream--;
3234 		mutex_exit(&fptr->fcip_mutex);
3235 #endif /* FCIP_ESBALLOC */
3236 
3237 		kmem_cache_free(fptr->fcip_sendup_cache, (void *)msg_elem);
3238 		mutex_enter(&fptr->fcip_sendup_mutex);
3239 		fptr->fcip_sendup_cnt--;
3240 	}
3241 
3242 
3243 #ifndef	__lock_lint
3244 	CALLB_CPR_EXIT(&fptr->fcip_cpr_info);
3245 #else
3246 	mutex_exit(&fptr->fcip_sendup_mutex);
3247 #endif /* __lock_lint */
3248 
3249 	/* Wake up fcip detach thread by the end */
3250 	cv_signal(&fptr->fcip_sendup_cv);
3251 
3252 	thread_exit();
3253 }
3254 
3255 #ifdef FCIP_ESBALLOC
3256 
3257 /*
3258  * called from the stream head when it is done using an unsolicited buffer.
3259  * We release this buffer then to the FCA for reuse.
3260  */
3261 static void
3262 fcip_ubfree(char *arg)
3263 {
3264 	struct fcip_esballoc_arg *fesb_argp = (struct fcip_esballoc_arg *)arg;
3265 	fc_unsol_buf_t	*ubuf;
3266 	frtn_t		*frtnp;
3267 	fcip_port_info_t		*fport;
3268 	struct fcip 			*fptr;
3269 
3270 
3271 	fport = fcip_get_port(fesb_argp->phandle);
3272 	fptr = fport->fcipp_fcip;
3273 
3274 	ASSERT(fesb_argp != NULL);
3275 	ubuf = fesb_argp->buf;
3276 	frtnp = fesb_argp->frtnp;
3277 
3278 
3279 	FCIP_DEBUG(FCIP_DEBUG_UPSTREAM,
3280 	    (CE_WARN, "freeing ubuf after esballoc in fcip_ubfree"));
3281 	(void) fc_ulp_ubrelease(fesb_argp->phandle, 1, &ubuf->ub_token);
3282 
3283 	mutex_enter(&fptr->fcip_mutex);
3284 	ASSERT(fptr->fcip_ub_upstream > 0);
3285 	fptr->fcip_ub_upstream--;
3286 	cv_signal(&fptr->fcip_ub_cv);
3287 	mutex_exit(&fptr->fcip_mutex);
3288 
3289 	kmem_free(frtnp, sizeof (frtn_t));
3290 	kmem_free(fesb_argp, sizeof (struct fcip_esballoc_arg));
3291 }
3292 
3293 #endif /* FCIP_ESBALLOC */
3294 
3295 /*
3296  * handle data other than that of type ETHERTYPE_IP and send it on its
3297  * way upstream to the right streams module to handle
3298  */
3299 static void
3300 fcip_sendup(struct fcip *fptr, mblk_t *mp, struct fcipstr *(*acceptfunc)())
3301 {
3302 	struct fcipstr	*slp, *nslp;
3303 	la_wwn_t	*dhostp;
3304 	mblk_t		*nmp;
3305 	uint32_t 	isgroupaddr;
3306 	int 		type;
3307 	uint32_t	hdrlen;
3308 	fcph_network_hdr_t	*nhdr;
3309 	llc_snap_hdr_t		*snaphdr;
3310 
3311 	FCIP_TNF_PROBE_1((fcip_sendup, "fcip io", /* CSTYLED */,
3312 		tnf_string, msg, "fcip sendup"));
3313 	nhdr = (fcph_network_hdr_t *)mp->b_rptr;
3314 	snaphdr =
3315 	    (llc_snap_hdr_t *)(mp->b_rptr + sizeof (fcph_network_hdr_t));
3316 	dhostp = &nhdr->net_dest_addr;
3317 	type = snaphdr->pid;
3318 	hdrlen = sizeof (fcph_network_hdr_t) + sizeof (llc_snap_hdr_t);
3319 
3320 	/* No group address with fibre channel */
3321 	isgroupaddr = 0;
3322 
3323 	/*
3324 	 * While holding a reader lock on the linked list of streams structures,
3325 	 * attempt to match the address criteria for each stream
3326 	 * and pass up the raw M_DATA ("fastpath") or a DL_UNITDATA_IND.
3327 	 */
3328 
3329 	rw_enter(&fcipstruplock, RW_READER);
3330 
3331 	if ((slp = (*acceptfunc)(fcipstrup, fptr, type, dhostp)) == NULL) {
3332 		rw_exit(&fcipstruplock);
3333 		FCIP_TNF_PROBE_1((fcip_sendup, "fcip io", /* CSTYLED */,
3334 		    tnf_string, msg, "fcip sendup - no slp"));
3335 		freemsg(mp);
3336 		return;
3337 	}
3338 
3339 	/*
3340 	 * Loop on matching open streams until (*acceptfunc)() returns NULL.
3341 	 */
3342 	for (; nslp = (*acceptfunc)(slp->sl_nextp, fptr, type, dhostp);
3343 	    slp = nslp) {
3344 		if (canputnext(slp->sl_rq)) {
3345 			if (nmp = dupmsg(mp)) {
3346 				if ((slp->sl_flags & FCIP_SLFAST) &&
3347 							!isgroupaddr) {
3348 					nmp->b_rptr += hdrlen;
3349 					putnext(slp->sl_rq, nmp);
3350 				} else if (slp->sl_flags & FCIP_SLRAW) {
3351 					/* No headers when FCIP_SLRAW is set */
3352 					putnext(slp->sl_rq, nmp);
3353 				} else if ((nmp = fcip_addudind(fptr, nmp,
3354 				    nhdr, type))) {
3355 					putnext(slp->sl_rq, nmp);
3356 				}
3357 			}
3358 		}
3359 	}
3360 
3361 	/*
3362 	 * Do the last one.
3363 	 */
3364 	if (canputnext(slp->sl_rq)) {
3365 		if (slp->sl_flags & FCIP_SLFAST) {
3366 			mp->b_rptr += hdrlen;
3367 			putnext(slp->sl_rq, mp);
3368 		} else if (slp->sl_flags & FCIP_SLRAW) {
3369 			putnext(slp->sl_rq, mp);
3370 		} else if ((mp = fcip_addudind(fptr, mp, nhdr, type))) {
3371 			putnext(slp->sl_rq, mp);
3372 		}
3373 	} else {
3374 		freemsg(mp);
3375 	}
3376 	FCIP_TNF_PROBE_1((fcip_sendup, "fcip io", /* CSTYLED */,
3377 	    tnf_string, msg, "fcip sendup done"));
3378 
3379 	rw_exit(&fcipstruplock);
3380 }
3381 
3382 /*
3383  * Match the stream based on type and wwn if necessary.
3384  * Destination wwn dhostp is passed to this routine is reserved
3385  * for future usage. We don't need to use it right now since port
3386  * to fcip instance mapping is unique and wwn is already validated when
3387  * packet comes to fcip.
3388  */
3389 /* ARGSUSED */
3390 static struct fcipstr *
3391 fcip_accept(struct fcipstr *slp, struct fcip *fptr, int type, la_wwn_t *dhostp)
3392 {
3393 	t_uscalar_t 	sap;
3394 
3395 	FCIP_TNF_PROBE_1((fcip_accept, "fcip io", /* CSTYLED */,
3396 	    tnf_string, msg, "fcip accept"));
3397 
3398 	for (; slp; slp = slp->sl_nextp) {
3399 		sap = slp->sl_sap;
3400 		FCIP_DEBUG(FCIP_DEBUG_UPSTREAM, (CE_CONT,
3401 		    "fcip_accept: checking next sap = %x, type = %x",
3402 		    sap, type));
3403 
3404 		if ((slp->sl_fcip == fptr) && (type == sap)) {
3405 			return (slp);
3406 		}
3407 	}
3408 	return (NULL);
3409 }
3410 
3411 /*
3412  * Handle DL_UNITDATA_IND messages
3413  */
3414 static mblk_t *
3415 fcip_addudind(struct fcip *fptr, mblk_t *mp, fcph_network_hdr_t *nhdr,
3416     int type)
3417 {
3418 	dl_unitdata_ind_t	*dludindp;
3419 	struct	fcipdladdr	*dlap;
3420 	mblk_t	*nmp;
3421 	int	size;
3422 	uint32_t hdrlen;
3423 	struct ether_addr	src_addr;
3424 	struct ether_addr	dest_addr;
3425 
3426 
3427 	hdrlen = (sizeof (llc_snap_hdr_t) + sizeof (fcph_network_hdr_t));
3428 	mp->b_rptr += hdrlen;
3429 
3430 	FCIP_TNF_PROBE_1((fcip_addudind, "fcip io", /* CSTYLED */,
3431 	    tnf_string, msg, "fcip addudind"));
3432 
3433 	/*
3434 	 * Allocate an M_PROTO mblk for the DL_UNITDATA_IND.
3435 	 */
3436 	size = sizeof (dl_unitdata_ind_t) + FCIPADDRL + FCIPADDRL;
3437 	if ((nmp = allocb(size, BPRI_LO)) == NULL) {
3438 		fptr->fcip_allocbfail++;
3439 		freemsg(mp);
3440 		return (NULL);
3441 	}
3442 	DB_TYPE(nmp) = M_PROTO;
3443 	nmp->b_wptr = nmp->b_datap->db_lim;
3444 	nmp->b_rptr = nmp->b_wptr - size;
3445 
3446 	/*
3447 	 * Construct a DL_UNITDATA_IND primitive.
3448 	 */
3449 	dludindp = (dl_unitdata_ind_t *)nmp->b_rptr;
3450 	dludindp->dl_primitive = DL_UNITDATA_IND;
3451 	dludindp->dl_dest_addr_length = FCIPADDRL;
3452 	dludindp->dl_dest_addr_offset = sizeof (dl_unitdata_ind_t);
3453 	dludindp->dl_src_addr_length = FCIPADDRL;
3454 	dludindp->dl_src_addr_offset = sizeof (dl_unitdata_ind_t) + FCIPADDRL;
3455 	dludindp->dl_group_address = 0;		/* not DL_MULTI */
3456 
3457 	dlap = (struct fcipdladdr *)(nmp->b_rptr + sizeof (dl_unitdata_ind_t));
3458 	wwn_to_ether(&nhdr->net_dest_addr, &dest_addr);
3459 	ether_bcopy(&dest_addr, &dlap->dl_phys);
3460 	dlap->dl_sap = (uint16_t)type;
3461 
3462 	dlap = (struct fcipdladdr *)(nmp->b_rptr + sizeof (dl_unitdata_ind_t)
3463 		+ FCIPADDRL);
3464 	wwn_to_ether(&nhdr->net_src_addr, &src_addr);
3465 	ether_bcopy(&src_addr, &dlap->dl_phys);
3466 	dlap->dl_sap = (uint16_t)type;
3467 
3468 	/*
3469 	 * Link the M_PROTO and M_DATA together.
3470 	 */
3471 	nmp->b_cont = mp;
3472 	return (nmp);
3473 }
3474 
3475 
3476 /*
3477  * The open routine. For clone opens, we return the next available minor
3478  * no. for the stream to use
3479  */
3480 /* ARGSUSED */
3481 static int
3482 fcip_open(queue_t *rq, dev_t *devp, int flag, int sflag, cred_t *credp)
3483 {
3484 	struct fcipstr	*slp;
3485 	struct fcipstr	**prevslp;
3486 	minor_t	minor;
3487 
3488 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "in fcip_open"));
3489 	FCIP_TNF_PROBE_1((fcip_open, "fcip io", /* CSTYLED */,
3490 		tnf_string, msg, "enter"));
3491 	/*
3492 	 * We need to ensure that the port driver is loaded before
3493 	 * we proceed
3494 	 */
3495 	if (ddi_hold_installed_driver(ddi_name_to_major(PORT_DRIVER)) == NULL) {
3496 		/* no port driver instances found */
3497 		FCIP_DEBUG(FCIP_DEBUG_STARTUP, (CE_WARN,
3498 		    "!ddi_hold_installed_driver of fp failed\n"));
3499 		return (ENXIO);
3500 	}
3501 	/* serialize opens */
3502 	rw_enter(&fcipstruplock, RW_WRITER);
3503 
3504 	prevslp = &fcipstrup;
3505 	if (sflag == CLONEOPEN) {
3506 		minor = 0;
3507 		for (; (slp = *prevslp) != NULL; prevslp = &slp->sl_nextp) {
3508 			if (minor < slp->sl_minor) {
3509 				break;
3510 			}
3511 			minor ++;
3512 		}
3513 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE,
3514 		    "getmajor returns 0x%x", getmajor(*devp)));
3515 		*devp = makedevice(getmajor(*devp), minor);
3516 	} else {
3517 		minor = getminor(*devp);
3518 	}
3519 
3520 	/*
3521 	 * check if our qp's private area is already initialized. If yes
3522 	 * the stream is already open - just return
3523 	 */
3524 	if (rq->q_ptr) {
3525 		goto done;
3526 	}
3527 
3528 	slp = GETSTRUCT(struct fcipstr, 1);
3529 	slp->sl_minor = minor;
3530 	slp->sl_rq = rq;
3531 	slp->sl_sap = 0;
3532 	slp->sl_flags = 0;
3533 	slp->sl_state = DL_UNATTACHED;
3534 	slp->sl_fcip = NULL;
3535 
3536 	mutex_init(&slp->sl_lock, NULL, MUTEX_DRIVER, NULL);
3537 
3538 	/*
3539 	 * link this new stream entry into list of active streams
3540 	 */
3541 	slp->sl_nextp = *prevslp;
3542 	*prevslp = slp;
3543 
3544 	rq->q_ptr = WR(rq)->q_ptr = (char *)slp;
3545 
3546 	/*
3547 	 * Disable automatic enabling of our write service procedures
3548 	 * we need to control this explicitly. This will prevent
3549 	 * anyone scheduling of our write service procedures.
3550 	 */
3551 	noenable(WR(rq));
3552 
3553 done:
3554 	rw_exit(&fcipstruplock);
3555 	/*
3556 	 * enable our put and service routines on the read side
3557 	 */
3558 	qprocson(rq);
3559 
3560 	/*
3561 	 * There is only one instance of fcip (instance = 0)
3562 	 * for multiple instances of hardware
3563 	 */
3564 	(void) qassociate(rq, 0);	/* don't allow drcompat to be pushed */
3565 	return (0);
3566 }
3567 
3568 /*
3569  * close an opened stream. The minor no. will then be available for
3570  * future opens.
3571  */
3572 /* ARGSUSED */
3573 static int
3574 fcip_close(queue_t *rq, int flag, cred_t *credp)
3575 {
3576 	struct fcipstr *slp;
3577 	struct fcipstr **prevslp;
3578 
3579 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "in fcip_close"));
3580 	FCIP_TNF_PROBE_1((fcip_close, "fcip io", /* CSTYLED */,
3581 		tnf_string, msg, "enter"));
3582 	ASSERT(rq);
3583 	/* we should also have the active stream pointer in q_ptr */
3584 	ASSERT(rq->q_ptr);
3585 
3586 	ddi_rele_driver(ddi_name_to_major(PORT_DRIVER));
3587 	/*
3588 	 * disable our put and service procedures. We had enabled them
3589 	 * on open
3590 	 */
3591 	qprocsoff(rq);
3592 	slp = (struct fcipstr *)rq->q_ptr;
3593 
3594 	/*
3595 	 * Implicitly detach stream  a stream from an interface.
3596 	 */
3597 	if (slp->sl_fcip) {
3598 		fcip_dodetach(slp);
3599 	}
3600 
3601 	(void) qassociate(rq, -1);	/* undo association in open */
3602 
3603 	rw_enter(&fcipstruplock, RW_WRITER);
3604 
3605 	/*
3606 	 * unlink this stream from the active stream list and free it
3607 	 */
3608 	for (prevslp = &fcipstrup; (slp = *prevslp) != NULL;
3609 	    prevslp = &slp->sl_nextp) {
3610 		if (slp == (struct fcipstr *)rq->q_ptr) {
3611 			break;
3612 		}
3613 	}
3614 
3615 	/* we should have found slp */
3616 	ASSERT(slp);
3617 
3618 	*prevslp = slp->sl_nextp;
3619 	mutex_destroy(&slp->sl_lock);
3620 	kmem_free(slp, sizeof (struct fcipstr));
3621 	rq->q_ptr = WR(rq)->q_ptr = NULL;
3622 
3623 	rw_exit(&fcipstruplock);
3624 	return (0);
3625 }
3626 
3627 /*
3628  * This is not an extension of the DDI_DETACH request. This routine
3629  * only detaches a stream from an interface
3630  */
3631 static void
3632 fcip_dodetach(struct fcipstr *slp)
3633 {
3634 	struct fcipstr	*tslp;
3635 	struct fcip	*fptr;
3636 
3637 	FCIP_DEBUG(FCIP_DEBUG_DETACH, (CE_NOTE, "in fcip_dodetach"));
3638 	FCIP_TNF_PROBE_1((fcip_dodetach, "fcip io", /* CSTYLED */,
3639 		tnf_string, msg, "enter"));
3640 	ASSERT(slp->sl_fcip != NULL);
3641 
3642 	fptr = slp->sl_fcip;
3643 	slp->sl_fcip = NULL;
3644 
3645 	/*
3646 	 * we don't support promiscuous mode currently but check
3647 	 * for and disable any promiscuous mode operation
3648 	 */
3649 	if (slp->sl_flags & SLALLPHYS) {
3650 		slp->sl_flags &= ~SLALLPHYS;
3651 	}
3652 
3653 	/*
3654 	 * disable ALLMULTI mode if all mulitcast addr are ON
3655 	 */
3656 	if (slp->sl_flags & SLALLMULTI) {
3657 		slp->sl_flags &= ~SLALLMULTI;
3658 	}
3659 
3660 	/*
3661 	 * we are most likely going to perform multicast by
3662 	 * broadcasting to the well known addr (D_ID) 0xFFFFFF or
3663 	 * ALPA 0x00 in case of public loops
3664 	 */
3665 
3666 
3667 	/*
3668 	 * detach unit from device structure.
3669 	 */
3670 	for (tslp = fcipstrup; tslp != NULL; tslp = tslp->sl_nextp) {
3671 		if (tslp->sl_fcip == fptr) {
3672 			break;
3673 		}
3674 	}
3675 	if (tslp == NULL) {
3676 		FCIP_DEBUG(FCIP_DEBUG_DETACH, (CE_WARN,
3677 		"fcip_dodeatch - active stream struct not found"));
3678 
3679 		/* unregister with Fabric nameserver?? */
3680 	}
3681 	slp->sl_state = DL_UNATTACHED;
3682 
3683 	fcip_setipq(fptr);
3684 }
3685 
3686 
3687 /*
3688  * Set or clear device ipq pointer.
3689  * Walk thru all the streams on this device, if a ETHERTYPE_IP
3690  * stream is found, assign device ipq to its sl_rq.
3691  */
3692 static void
3693 fcip_setipq(struct fcip *fptr)
3694 {
3695 	struct fcipstr	*slp;
3696 	int		ok = 1;
3697 	queue_t		*ipq = NULL;
3698 
3699 	FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_NOTE, "entered fcip_setipq"));
3700 
3701 	rw_enter(&fcipstruplock, RW_READER);
3702 
3703 	for (slp = fcipstrup; slp != NULL; slp = slp->sl_nextp) {
3704 		if (slp->sl_fcip == fptr) {
3705 			if (slp->sl_flags & (SLALLPHYS|SLALLSAP)) {
3706 				ok = 0;
3707 			}
3708 			if (slp->sl_sap == ETHERTYPE_IP) {
3709 				if (ipq == NULL) {
3710 					ipq = slp->sl_rq;
3711 				} else {
3712 					ok = 0;
3713 				}
3714 			}
3715 		}
3716 	}
3717 
3718 	rw_exit(&fcipstruplock);
3719 
3720 	if (fcip_check_port_exists(fptr)) {
3721 		/* fptr passed to us is stale */
3722 		return;
3723 	}
3724 
3725 	mutex_enter(&fptr->fcip_mutex);
3726 	if (ok) {
3727 		fptr->fcip_ipq = ipq;
3728 	} else {
3729 		fptr->fcip_ipq = NULL;
3730 	}
3731 	mutex_exit(&fptr->fcip_mutex);
3732 }
3733 
3734 
3735 /* ARGSUSED */
3736 static void
3737 fcip_ioctl(queue_t *wq, mblk_t *mp)
3738 {
3739 	struct iocblk		*iocp = (struct iocblk *)mp->b_rptr;
3740 	struct fcipstr		*slp = (struct fcipstr *)wq->q_ptr;
3741 
3742 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
3743 	    (CE_NOTE, "in fcip ioctl : %d", iocp->ioc_cmd));
3744 	FCIP_TNF_PROBE_1((fcip_ioctl, "fcip io", /* CSTYLED */,
3745 		tnf_string, msg, "enter"));
3746 
3747 	switch (iocp->ioc_cmd) {
3748 	case DLIOCRAW:
3749 		slp->sl_flags |= FCIP_SLRAW;
3750 		miocack(wq, mp, 0, 0);
3751 		break;
3752 
3753 	case DL_IOC_HDR_INFO:
3754 		fcip_dl_ioc_hdr_info(wq, mp);
3755 		break;
3756 
3757 	default:
3758 		miocnak(wq, mp, 0, EINVAL);
3759 		break;
3760 	}
3761 }
3762 
3763 /*
3764  * The streams 'Put' routine.
3765  */
3766 /* ARGSUSED */
3767 static int
3768 fcip_wput(queue_t *wq, mblk_t *mp)
3769 {
3770 	struct fcipstr *slp = (struct fcipstr *)wq->q_ptr;
3771 	struct fcip *fptr;
3772 	struct fcip_dest *fdestp;
3773 	fcph_network_hdr_t *headerp;
3774 
3775 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
3776 	    (CE_NOTE, "in fcip_wput :: type:%x", DB_TYPE(mp)));
3777 
3778 	switch (DB_TYPE(mp)) {
3779 	case M_DATA: {
3780 
3781 		fptr = slp->sl_fcip;
3782 
3783 		if (((slp->sl_flags & (FCIP_SLFAST|FCIP_SLRAW)) == 0) ||
3784 		    (slp->sl_state != DL_IDLE) ||
3785 		    (fptr == NULL)) {
3786 			/*
3787 			 * set error in the message block and send a reply
3788 			 * back upstream. Sun's merror routine does this
3789 			 * for us more cleanly.
3790 			 */
3791 			merror(wq, mp, EPROTO);
3792 			break;
3793 		}
3794 
3795 		/*
3796 		 * if any messages are already enqueued or if the interface
3797 		 * is in promiscuous mode, causing the packets to loop back
3798 		 * up, then enqueue the message. Otherwise just transmit
3799 		 * the message. putq() puts the message on fcip's
3800 		 * write queue and qenable() puts the queue (wq) on
3801 		 * the list of queues to be called by the streams scheduler.
3802 		 */
3803 		if (wq->q_first) {
3804 			(void) putq(wq, mp);
3805 			fptr->fcip_wantw = 1;
3806 			qenable(wq);
3807 		} else if (fptr->fcip_flags & FCIP_PROMISC) {
3808 			/*
3809 			 * Promiscous mode not supported but add this code in
3810 			 * case it will be supported in future.
3811 			 */
3812 			(void) putq(wq, mp);
3813 			qenable(wq);
3814 		} else {
3815 
3816 			headerp = (fcph_network_hdr_t *)mp->b_rptr;
3817 			fdestp = fcip_get_dest(fptr, &headerp->net_dest_addr);
3818 
3819 			if (fdestp == NULL) {
3820 				merror(wq, mp, EPROTO);
3821 				break;
3822 			}
3823 
3824 			ASSERT(fdestp != NULL);
3825 
3826 			(void) fcip_start(wq, mp, fptr, fdestp, KM_SLEEP);
3827 		}
3828 		break;
3829 	}
3830 	case M_PROTO:
3831 	case M_PCPROTO:
3832 		/*
3833 		 * to prevent recursive calls into fcip_proto
3834 		 * (PROTO and PCPROTO messages are handled by fcip_proto)
3835 		 * let the service procedure handle these messages by
3836 		 * calling putq here.
3837 		 */
3838 		(void) putq(wq, mp);
3839 		qenable(wq);
3840 		break;
3841 
3842 	case M_IOCTL:
3843 		fcip_ioctl(wq, mp);
3844 		break;
3845 
3846 	case M_FLUSH:
3847 		if (*mp->b_rptr & FLUSHW) {
3848 			flushq(wq, FLUSHALL);
3849 			*mp->b_rptr &= ~FLUSHW;
3850 		}
3851 		/*
3852 		 * we have both FLUSHW and FLUSHR set with FLUSHRW
3853 		 */
3854 		if (*mp->b_rptr & FLUSHR) {
3855 			/*
3856 			 * send msg back upstream. qreply() takes care
3857 			 * of using the RD(wq) queue on its reply
3858 			 */
3859 			qreply(wq, mp);
3860 		} else {
3861 			freemsg(mp);
3862 		}
3863 		break;
3864 
3865 	default:
3866 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
3867 		    (CE_NOTE, "default msg type: %x", DB_TYPE(mp)));
3868 		freemsg(mp);
3869 		break;
3870 	}
3871 	return (0);
3872 }
3873 
3874 
3875 /*
3876  * Handle M_PROTO and M_PCPROTO messages
3877  */
3878 /* ARGSUSED */
3879 static void
3880 fcip_proto(queue_t *wq, mblk_t *mp)
3881 {
3882 	union DL_primitives	*dlp;
3883 	struct fcipstr		*slp;
3884 	t_uscalar_t		prim;
3885 
3886 	slp = (struct fcipstr *)wq->q_ptr;
3887 	dlp = (union DL_primitives *)mp->b_rptr;
3888 	prim = dlp->dl_primitive;		/* the DLPI command */
3889 
3890 	FCIP_TNF_PROBE_5((fcip_proto, "fcip io", /* CSTYLED */,
3891 		tnf_string, msg, "enter",
3892 		tnf_opaque, wq, wq,
3893 		tnf_opaque, mp, mp,
3894 		tnf_opaque, MP_DB_TYPE, DB_TYPE(mp),
3895 		tnf_opaque, dl_primitive, dlp->dl_primitive));
3896 
3897 	FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_NOTE, "dl_primitve : %x", prim));
3898 
3899 	mutex_enter(&slp->sl_lock);
3900 
3901 	switch (prim) {
3902 	case DL_UNITDATA_REQ:
3903 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3904 			tnf_string, msg, "unit data request"));
3905 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "unit data request"));
3906 		fcip_udreq(wq, mp);
3907 		break;
3908 
3909 	case DL_ATTACH_REQ:
3910 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3911 			tnf_string, msg, "Attach request"));
3912 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "Attach request"));
3913 		fcip_areq(wq, mp);
3914 		break;
3915 
3916 	case DL_DETACH_REQ:
3917 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3918 			tnf_string, msg, "Detach request"));
3919 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "Detach request"));
3920 		fcip_dreq(wq, mp);
3921 		break;
3922 
3923 	case DL_BIND_REQ:
3924 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "Bind request"));
3925 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3926 			tnf_string, msg, "Bind request"));
3927 		fcip_breq(wq, mp);
3928 		break;
3929 
3930 	case DL_UNBIND_REQ:
3931 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3932 			tnf_string, msg, "unbind request"));
3933 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "unbind request"));
3934 		fcip_ubreq(wq, mp);
3935 		break;
3936 
3937 	case DL_INFO_REQ:
3938 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3939 			tnf_string, msg, "Info request"));
3940 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "Info request"));
3941 		fcip_ireq(wq, mp);
3942 		break;
3943 
3944 	case DL_SET_PHYS_ADDR_REQ:
3945 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3946 			tnf_string, msg, "set phy addr request"));
3947 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
3948 		    (CE_NOTE, "set phy addr request"));
3949 		fcip_spareq(wq, mp);
3950 		break;
3951 
3952 	case DL_PHYS_ADDR_REQ:
3953 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3954 			tnf_string, msg, "phy addr request"));
3955 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "phy addr request"));
3956 		fcip_pareq(wq, mp);
3957 		break;
3958 
3959 	case DL_ENABMULTI_REQ:
3960 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3961 			tnf_string, msg, "Enable Multicast request"));
3962 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
3963 		    (CE_NOTE, "Enable Multicast request"));
3964 		dlerrorack(wq, mp, prim, DL_UNSUPPORTED, 0);
3965 		break;
3966 
3967 	case DL_DISABMULTI_REQ:
3968 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3969 			tnf_string, msg, "Disable Multicast request"));
3970 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
3971 		    (CE_NOTE, "Disable Multicast request"));
3972 		dlerrorack(wq, mp, prim, DL_UNSUPPORTED, 0);
3973 		break;
3974 
3975 	case DL_PROMISCON_REQ:
3976 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3977 			tnf_string, msg, "Promiscuous mode ON request"));
3978 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
3979 		    (CE_NOTE, "Promiscuous mode ON request"));
3980 		dlerrorack(wq, mp, prim, DL_UNSUPPORTED, 0);
3981 		break;
3982 
3983 	case DL_PROMISCOFF_REQ:
3984 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3985 			tnf_string, msg, "Promiscuous mode OFF request"));
3986 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
3987 		    (CE_NOTE, "Promiscuous mode OFF request"));
3988 		dlerrorack(wq, mp, prim, DL_UNSUPPORTED, 0);
3989 		break;
3990 
3991 	default:
3992 		FCIP_TNF_PROBE_1((fcip_proto, "fcip io", /* CSTYLED */,
3993 			tnf_string, msg, "Unsupported request"));
3994 		dlerrorack(wq, mp, prim, DL_UNSUPPORTED, 0);
3995 		break;
3996 	}
3997 	mutex_exit(&slp->sl_lock);
3998 }
3999 
4000 /*
4001  * Always enqueue M_PROTO and M_PCPROTO messages pn the wq and M_DATA
4002  * messages sometimes. Processing of M_PROTO and M_PCPROTO messages
4003  * require us to hold fcip's internal locks across (upstream) putnext
4004  * calls. Specifically fcip_intr could hold fcip_intrlock and fcipstruplock
4005  * when it calls putnext(). That thread could loop back around to call
4006  * fcip_wput and eventually fcip_init() to cause a recursive mutex panic
4007  *
4008  * M_DATA messages are enqueued only if we are out of xmit resources. Once
4009  * the transmit resources are available the service procedure is enabled
4010  * and an attempt is made to xmit all messages on the wq.
4011  */
4012 /* ARGSUSED */
4013 static int
4014 fcip_wsrv(queue_t *wq)
4015 {
4016 	mblk_t		*mp;
4017 	struct fcipstr	*slp;
4018 	struct fcip	*fptr;
4019 	struct fcip_dest *fdestp;
4020 	fcph_network_hdr_t *headerp;
4021 
4022 	slp = (struct fcipstr *)wq->q_ptr;
4023 	fptr = slp->sl_fcip;
4024 
4025 	FCIP_TNF_PROBE_2((fcip_wsrv, "fcip io", /* CSTYLED */,
4026 		tnf_string, msg, "enter",
4027 		tnf_opaque, wq, wq));
4028 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "fcip wsrv"));
4029 
4030 	while (mp = getq(wq)) {
4031 		switch (DB_TYPE(mp)) {
4032 		case M_DATA:
4033 			if (fptr && mp) {
4034 				headerp = (fcph_network_hdr_t *)mp->b_rptr;
4035 				fdestp = fcip_get_dest(fptr,
4036 				    &headerp->net_dest_addr);
4037 				if (fdestp == NULL) {
4038 					freemsg(mp);
4039 					goto done;
4040 				}
4041 				if (fcip_start(wq, mp, fptr, fdestp,
4042 				    KM_SLEEP)) {
4043 					goto done;
4044 				}
4045 			} else {
4046 				freemsg(mp);
4047 			}
4048 			break;
4049 
4050 		case M_PROTO:
4051 		case M_PCPROTO:
4052 			FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
4053 			    (CE_NOTE, "PROT msg in wsrv"));
4054 			fcip_proto(wq, mp);
4055 			break;
4056 		default:
4057 			break;
4058 		}
4059 	}
4060 done:
4061 	return (0);
4062 }
4063 
4064 
4065 /*
4066  * This routine is called from fcip_wsrv to send a message downstream
4067  * on the fibre towards its destination. This routine performs the
4068  * actual WWN to D_ID mapping by looking up the routing and destination
4069  * tables.
4070  */
4071 /* ARGSUSED */
4072 static int
4073 fcip_start(queue_t *wq, mblk_t *mp, struct fcip *fptr,
4074     struct fcip_dest *fdestp, int flags)
4075 {
4076 	int			rval;
4077 	int			free;
4078 	fcip_pkt_t		*fcip_pkt;
4079 	fc_packet_t		*fc_pkt;
4080 	fcip_port_info_t	*fport = fptr->fcip_port_info;
4081 	size_t			datalen;
4082 
4083 	FCIP_TNF_PROBE_4((fcip_start, "fcip io", /* CSTYLED */,
4084 	    tnf_string, msg, "enter", tnf_opaque, wq, wq,
4085 	    tnf_opaque, mp, mp,
4086 	    tnf_opaque, MP_DB_TYPE, DB_TYPE(mp)));
4087 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "in fcipstart"));
4088 
4089 	ASSERT(fdestp != NULL);
4090 
4091 	/*
4092 	 * Only return if port has gone offline and not come back online
4093 	 * in a while
4094 	 */
4095 	if (fptr->fcip_flags & FCIP_LINK_DOWN) {
4096 		freemsg(mp);
4097 		return (0);
4098 	}
4099 
4100 	/*
4101 	 * The message block coming in here already has the network and
4102 	 * llc_snap hdr stuffed in
4103 	 */
4104 	/*
4105 	 * Traditionally ethernet drivers at sun handle 3 cases here -
4106 	 * 1. messages with one mblk
4107 	 * 2. messages with 2 mblks
4108 	 * 3. messages with >2 mblks
4109 	 * For now lets handle all the 3 cases in a single case where we
4110 	 * put them together in one mblk that has all the data
4111 	 */
4112 
4113 	if (mp->b_cont != NULL) {
4114 		if (!pullupmsg(mp, -1)) {
4115 			FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
4116 			    (CE_WARN, "failed to concat message"));
4117 			freemsg(mp);
4118 			return (1);
4119 		}
4120 	}
4121 
4122 	datalen = msgsize(mp);
4123 
4124 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE,
4125 	    "msgsize with nhdr & llcsnap hdr in fcip_pkt_alloc 0x%lx",
4126 	    datalen));
4127 
4128 	/*
4129 	 * We cannot have requests larger than FCIPMTU+Headers
4130 	 */
4131 	if (datalen > (FCIPMTU + sizeof (llc_snap_hdr_t) +
4132 		sizeof (fcph_network_hdr_t))) {
4133 		freemsg(mp);
4134 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE,
4135 		    "fcip_pkt_alloc: datalen is larger than "
4136 		    "max possible size."));
4137 		return (1);
4138 	}
4139 
4140 	fcip_pkt = fcip_pkt_alloc(fptr, mp, flags, datalen);
4141 	if (fcip_pkt == NULL) {
4142 		(void) putbq(wq, mp);
4143 		return (1);
4144 	}
4145 
4146 	fcip_pkt->fcip_pkt_mp = mp;
4147 	fcip_pkt->fcip_pkt_wq = wq;
4148 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
4149 
4150 	mutex_enter(&fdestp->fcipd_mutex);
4151 	/*
4152 	 * If the device dynamically disappeared, just fail the request.
4153 	 */
4154 	if (fdestp->fcipd_rtable == NULL) {
4155 		mutex_exit(&fdestp->fcipd_mutex);
4156 		fcip_pkt_free(fcip_pkt, 1);
4157 		return (1);
4158 	}
4159 
4160 	/*
4161 	 * Now that we've assigned pkt_pd, we can call fc_ulp_init_packet
4162 	 */
4163 
4164 	fc_pkt->pkt_pd = fdestp->fcipd_pd;
4165 
4166 	if (fc_ulp_init_packet((opaque_t)fport->fcipp_handle,
4167 	    fc_pkt, flags) != FC_SUCCESS) {
4168 		mutex_exit(&fdestp->fcipd_mutex);
4169 		fcip_pkt_free(fcip_pkt, 1);
4170 		return (1);
4171 	}
4172 
4173 	fcip_fdestp_enqueue_pkt(fdestp, fcip_pkt);
4174 	fcip_pkt->fcip_pkt_dest = fdestp;
4175 	fc_pkt->pkt_fca_device = fdestp->fcipd_fca_dev;
4176 
4177 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE,
4178 	    "setting cmdlen to 0x%x: rsp 0x%x : data 0x%x",
4179 	    fc_pkt->pkt_cmdlen, fc_pkt->pkt_rsplen, fc_pkt->pkt_datalen));
4180 
4181 	fcip_init_unicast_pkt(fcip_pkt, fport->fcipp_sid,
4182 	    fdestp->fcipd_did, fcip_pkt_callback);
4183 
4184 	fdestp->fcipd_ncmds++;
4185 
4186 	mutex_exit(&fdestp->fcipd_mutex);
4187 	if ((rval = fcip_transport(fcip_pkt)) == FC_SUCCESS) {
4188 		fptr->fcip_opackets++;
4189 		return (0);
4190 	}
4191 
4192 	free = (rval == FC_STATEC_BUSY || rval == FC_OFFLINE ||
4193 	    rval == FC_TRAN_BUSY) ? 0 : 1;
4194 
4195 	mutex_enter(&fdestp->fcipd_mutex);
4196 	rval = fcip_fdestp_dequeue_pkt(fdestp, fcip_pkt);
4197 
4198 	if (!rval) {
4199 		fcip_pkt = NULL;
4200 	} else {
4201 		fdestp->fcipd_ncmds--;
4202 	}
4203 	mutex_exit(&fdestp->fcipd_mutex);
4204 
4205 	if (fcip_pkt != NULL) {
4206 		fcip_pkt_free(fcip_pkt, free);
4207 	}
4208 
4209 	if (!free) {
4210 		(void) putbq(wq, mp);
4211 	}
4212 
4213 	return (1);
4214 }
4215 
4216 
4217 /*
4218  * This routine enqueus a packet marked to be issued to the
4219  * transport in the dest structure. This enables us to timeout any
4220  * request stuck with the FCA/transport for long periods of time
4221  * without a response. fcip_pkt_timeout will attempt to clean up
4222  * any packets hung in this state of limbo.
4223  */
4224 static void
4225 fcip_fdestp_enqueue_pkt(struct fcip_dest *fdestp, fcip_pkt_t *fcip_pkt)
4226 {
4227 	ASSERT(mutex_owned(&fdestp->fcipd_mutex));
4228 	FCIP_TNF_PROBE_1((fcip_fdestp_enqueue_pkt, "fcip io", /* CSTYLED */,
4229 		tnf_string, msg, "destp enq pkt"));
4230 
4231 	/*
4232 	 * Just hang it off the head of packet list
4233 	 */
4234 	fcip_pkt->fcip_pkt_next = fdestp->fcipd_head;
4235 	fcip_pkt->fcip_pkt_prev = NULL;
4236 	fcip_pkt->fcip_pkt_flags |= FCIP_PKT_IN_LIST;
4237 
4238 	if (fdestp->fcipd_head != NULL) {
4239 		ASSERT(fdestp->fcipd_head->fcip_pkt_prev == NULL);
4240 		fdestp->fcipd_head->fcip_pkt_prev = fcip_pkt;
4241 	}
4242 
4243 	fdestp->fcipd_head = fcip_pkt;
4244 }
4245 
4246 
4247 /*
4248  * dequeues any packets after the transport/FCA tells us it has
4249  * been successfully sent on its way. Ofcourse it doesn't mean that
4250  * the packet will actually reach its destination but its atleast
4251  * a step closer in that direction
4252  */
4253 static int
4254 fcip_fdestp_dequeue_pkt(struct fcip_dest *fdestp, fcip_pkt_t *fcip_pkt)
4255 {
4256 	fcip_pkt_t	*fcipd_pkt;
4257 
4258 	ASSERT(mutex_owned(&fdestp->fcipd_mutex));
4259 	if (fcip_pkt->fcip_pkt_flags & FCIP_PKT_IN_TIMEOUT) {
4260 		fcipd_pkt = fdestp->fcipd_head;
4261 		while (fcipd_pkt) {
4262 			if (fcipd_pkt == fcip_pkt) {
4263 				fcip_pkt_t	*pptr = NULL;
4264 
4265 				if (fcipd_pkt == fdestp->fcipd_head) {
4266 					ASSERT(fcipd_pkt->fcip_pkt_prev ==
4267 					    NULL);
4268 					fdestp->fcipd_head =
4269 					    fcipd_pkt->fcip_pkt_next;
4270 				} else {
4271 					pptr = fcipd_pkt->fcip_pkt_prev;
4272 					ASSERT(pptr != NULL);
4273 					pptr->fcip_pkt_next =
4274 					    fcipd_pkt->fcip_pkt_next;
4275 				}
4276 				if (fcipd_pkt->fcip_pkt_next) {
4277 					pptr = fcipd_pkt->fcip_pkt_next;
4278 					pptr->fcip_pkt_prev =
4279 					    fcipd_pkt->fcip_pkt_prev;
4280 				}
4281 				fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_LIST;
4282 				break;
4283 			}
4284 			fcipd_pkt = fcipd_pkt->fcip_pkt_next;
4285 		}
4286 	} else {
4287 		if (fcip_pkt->fcip_pkt_prev == NULL) {
4288 			ASSERT(fdestp->fcipd_head == fcip_pkt);
4289 			fdestp->fcipd_head = fcip_pkt->fcip_pkt_next;
4290 		} else {
4291 			fcip_pkt->fcip_pkt_prev->fcip_pkt_next =
4292 			    fcip_pkt->fcip_pkt_next;
4293 		}
4294 
4295 		if (fcip_pkt->fcip_pkt_next) {
4296 			fcip_pkt->fcip_pkt_next->fcip_pkt_prev =
4297 			    fcip_pkt->fcip_pkt_prev;
4298 		}
4299 
4300 		fcipd_pkt = fcip_pkt;
4301 		fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_LIST;
4302 	}
4303 
4304 	return (fcipd_pkt == fcip_pkt);
4305 }
4306 
4307 /*
4308  * The transport routine - this is the routine that actually calls
4309  * into the FCA driver (through the transport ofcourse) to transmit a
4310  * datagram on the fibre. The dest struct assoicated with the port to
4311  * which the data is intended is already bound to the packet, this routine
4312  * only takes care of marking the packet a broadcast packet if it is
4313  * intended to be a broadcast request. This permits the transport to send
4314  * the packet down on the wire even if it doesn't have an entry for the
4315  * D_ID in its d_id hash tables.
4316  */
4317 static int
4318 fcip_transport(fcip_pkt_t *fcip_pkt)
4319 {
4320 	struct fcip		*fptr;
4321 	fc_packet_t		*fc_pkt;
4322 	fcip_port_info_t	*fport;
4323 	struct fcip_dest	*fdestp;
4324 	uint32_t		did;
4325 	int			rval = FC_FAILURE;
4326 	struct fcip_routing_table *frp = NULL;
4327 
4328 	FCIP_TNF_PROBE_1((fcip_transport, "fcip io", /* CSTYLED */,
4329 		tnf_string, msg, "enter"));
4330 
4331 	fptr = fcip_pkt->fcip_pkt_fptr;
4332 	fport = fptr->fcip_port_info;
4333 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
4334 	fdestp = fcip_pkt->fcip_pkt_dest;
4335 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_WARN, "fcip_transport called"));
4336 
4337 	did = fptr->fcip_broadcast_did;
4338 	if (fc_pkt->pkt_cmd_fhdr.d_id == did &&
4339 	    fc_pkt->pkt_tran_type != FC_PKT_BROADCAST) {
4340 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
4341 		    (CE_NOTE, "trantype set to BROADCAST"));
4342 		fc_pkt->pkt_tran_type = FC_PKT_BROADCAST;
4343 	}
4344 
4345 	mutex_enter(&fptr->fcip_mutex);
4346 	if ((fc_pkt->pkt_tran_type != FC_PKT_BROADCAST) &&
4347 	    (fc_pkt->pkt_pd == NULL)) {
4348 		mutex_exit(&fptr->fcip_mutex);
4349 		FCIP_TNF_PROBE_1((fcip_transport, "fcip io", /* CSTYLED */,
4350 		    tnf_string, msg, "fcip transport no pd"));
4351 		return (rval);
4352 	} else if (fptr->fcip_port_state == FCIP_PORT_OFFLINE) {
4353 		mutex_exit(&fptr->fcip_mutex);
4354 		FCIP_TNF_PROBE_1((fcip_transport, "fcip io", /* CSTYLED */,
4355 		    tnf_string, msg, "fcip transport port offline"));
4356 		return (FC_TRAN_BUSY);
4357 	}
4358 	mutex_exit(&fptr->fcip_mutex);
4359 
4360 	if (fdestp) {
4361 		struct fcip_routing_table 	*frp;
4362 
4363 		frp = fdestp->fcipd_rtable;
4364 		mutex_enter(&fptr->fcip_rt_mutex);
4365 		mutex_enter(&fdestp->fcipd_mutex);
4366 		if (fc_pkt->pkt_pd != NULL) {
4367 			if ((frp == NULL) ||
4368 			    (frp && FCIP_RTE_UNAVAIL(frp->fcipr_state))) {
4369 				mutex_exit(&fdestp->fcipd_mutex);
4370 				mutex_exit(&fptr->fcip_rt_mutex);
4371 				if (frp &&
4372 				    (frp->fcipr_state == FCIP_RT_INVALID)) {
4373 					FCIP_TNF_PROBE_1((fcip_transport,
4374 					    "fcip io", /* CSTYLED */,
4375 					    tnf_string, msg,
4376 					    "fcip transport - TRANBUSY"));
4377 					return (FC_TRAN_BUSY);
4378 				} else {
4379 					FCIP_TNF_PROBE_1((fcip_transport,
4380 					    "fcip io", /* CSTYLED */,
4381 					    tnf_string, msg,
4382 					    "fcip transport: frp unavailable"));
4383 					return (rval);
4384 				}
4385 			}
4386 		}
4387 		mutex_exit(&fdestp->fcipd_mutex);
4388 		mutex_exit(&fptr->fcip_rt_mutex);
4389 		ASSERT(fcip_pkt->fcip_pkt_flags & FCIP_PKT_IN_LIST);
4390 	}
4391 
4392 	/* Explicitly invalidate this field till fcip decides to use it */
4393 	fc_pkt->pkt_ulp_rscn_infop = NULL;
4394 
4395 	rval = fc_ulp_transport(fport->fcipp_handle, fc_pkt);
4396 	if (rval == FC_STATEC_BUSY || rval == FC_OFFLINE) {
4397 		/*
4398 		 * Need to queue up the command for retry
4399 		 */
4400 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
4401 		    (CE_WARN, "ulp_transport failed: 0x%x", rval));
4402 	} else if (rval == FC_LOGINREQ && (frp != NULL)) {
4403 		(void) fcip_do_plogi(fptr, frp);
4404 	} else if (rval == FC_BADPACKET && (frp != NULL)) {
4405 		/*
4406 		 * There is a distinct possiblity in our scheme of things
4407 		 * that we have a routing table entry with a NULL pd struct.
4408 		 * Mark the routing table entry for removal if it is not a
4409 		 * broadcast entry
4410 		 */
4411 		if ((frp->fcipr_d_id.port_id != 0x0) &&
4412 		    (frp->fcipr_d_id.port_id != 0xffffff)) {
4413 			mutex_enter(&fptr->fcip_rt_mutex);
4414 			frp->fcipr_pd = NULL;
4415 			frp->fcipr_state = PORT_DEVICE_INVALID;
4416 			mutex_exit(&fptr->fcip_rt_mutex);
4417 		}
4418 	}
4419 
4420 	FCIP_TNF_PROBE_1((fcip_transport, "fcip io", /* CSTYLED */,
4421 	    tnf_string, msg, "fcip transport done"));
4422 	return (rval);
4423 }
4424 
4425 /*
4426  * Call back routine. Called by the FCA/transport when the messages
4427  * has been put onto the wire towards its intended destination. We can
4428  * now free the fc_packet associated with the message
4429  */
4430 static void
4431 fcip_pkt_callback(fc_packet_t *fc_pkt)
4432 {
4433 	int			rval;
4434 	fcip_pkt_t		*fcip_pkt;
4435 	struct fcip_dest	*fdestp;
4436 
4437 	fcip_pkt = (fcip_pkt_t *)fc_pkt->pkt_ulp_private;
4438 	fdestp = fcip_pkt->fcip_pkt_dest;
4439 
4440 	/*
4441 	 * take the lock early so that we don't have a race condition
4442 	 * with fcip_timeout
4443 	 *
4444 	 * fdestp->fcipd_mutex isn't really intended to lock per
4445 	 * packet struct - see bug 5105592 for permanent solution
4446 	 */
4447 	mutex_enter(&fdestp->fcipd_mutex);
4448 
4449 	fcip_pkt->fcip_pkt_flags |= FCIP_PKT_RETURNED;
4450 	fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_ABORT;
4451 	if (fcip_pkt->fcip_pkt_flags & FCIP_PKT_IN_TIMEOUT) {
4452 		mutex_exit(&fdestp->fcipd_mutex);
4453 		return;
4454 	}
4455 
4456 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "pkt callback"));
4457 
4458 	ASSERT(fdestp->fcipd_rtable != NULL);
4459 	ASSERT(fcip_pkt->fcip_pkt_flags & FCIP_PKT_IN_LIST);
4460 	rval = fcip_fdestp_dequeue_pkt(fdestp, fcip_pkt);
4461 	fdestp->fcipd_ncmds--;
4462 	mutex_exit(&fdestp->fcipd_mutex);
4463 
4464 	if (rval) {
4465 		fcip_pkt_free(fcip_pkt, 1);
4466 	}
4467 
4468 	FCIP_TNF_PROBE_1((fcip_pkt_callback, "fcip io", /* CSTYLED */,
4469 		tnf_string, msg, "pkt callback done"));
4470 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_NOTE, "pkt callback done"));
4471 }
4472 
4473 /*
4474  * Return 1 if the topology is supported, else return 0.
4475  * Topology support is consistent with what the whole
4476  * stack supports together.
4477  */
4478 static int
4479 fcip_is_supported_fc_topology(int fc_topology)
4480 {
4481 	switch (fc_topology) {
4482 
4483 	case FC_TOP_PRIVATE_LOOP :
4484 	case FC_TOP_PUBLIC_LOOP :
4485 	case FC_TOP_FABRIC :
4486 	case FC_TOP_NO_NS :
4487 		return (1);
4488 	default :
4489 		return (0);
4490 	}
4491 }
4492 
4493 /*
4494  * handle any topology specific initializations here
4495  * this routine must be called while holding fcip_mutex
4496  */
4497 /* ARGSUSED */
4498 static void
4499 fcip_handle_topology(struct fcip *fptr)
4500 {
4501 
4502 	fcip_port_info_t	*fport = fptr->fcip_port_info;
4503 
4504 	ASSERT(mutex_owned(&fptr->fcip_mutex));
4505 
4506 	/*
4507 	 * Since we know the port's topology - handle topology
4508 	 * specific details here. In Point to Point and Private Loop
4509 	 * topologies - we would probably not have a name server
4510 	 */
4511 
4512 	FCIP_TNF_PROBE_3((fcip_handle_topology, "fcip io", /* CSTYLED */,
4513 		tnf_string, msg, "enter",
4514 		tnf_uint, port_state, fport->fcipp_pstate,
4515 		tnf_uint, topology, fport->fcipp_topology));
4516 	FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_NOTE, "port state: %x, topology %x",
4517 		fport->fcipp_pstate, fport->fcipp_topology));
4518 
4519 	fptr->fcip_broadcast_did = fcip_get_broadcast_did(fptr);
4520 	mutex_exit(&fptr->fcip_mutex);
4521 	(void) fcip_dest_add_broadcast_entry(fptr, 0);
4522 	mutex_enter(&fptr->fcip_mutex);
4523 
4524 	if (!fcip_is_supported_fc_topology(fport->fcipp_topology)) {
4525 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4526 		    (CE_WARN, "fcip(0x%x): Unsupported port topology (0x%x)",
4527 		    fptr->fcip_instance, fport->fcipp_topology));
4528 		return;
4529 	}
4530 
4531 	switch (fport->fcipp_topology) {
4532 	case FC_TOP_PRIVATE_LOOP: {
4533 
4534 		fc_portmap_t		*port_map;
4535 		uint32_t		listlen, alloclen;
4536 		/*
4537 		 * we may have to maintain routing. Get a list of
4538 		 * all devices on this port that the transport layer is
4539 		 * aware of. Check if any of them is a IS8802 type port,
4540 		 * if yes get its WWN and DID mapping and cache it in
4541 		 * the purport routing table. Since there is no
4542 		 * State Change notification for private loop/point_point
4543 		 * topologies - this table may not be accurate. The static
4544 		 * routing table is updated on a state change callback.
4545 		 */
4546 		FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_WARN, "port state valid!!"));
4547 		fptr->fcip_port_state = FCIP_PORT_ONLINE;
4548 		listlen = alloclen = FCIP_MAX_PORTS;
4549 		port_map = (fc_portmap_t *)
4550 		    kmem_zalloc((FCIP_MAX_PORTS * sizeof (fc_portmap_t)),
4551 		    KM_SLEEP);
4552 		if (fc_ulp_getportmap(fport->fcipp_handle, &port_map,
4553 		    &listlen, FC_ULP_PLOGI_PRESERVE) == FC_SUCCESS) {
4554 			mutex_exit(&fptr->fcip_mutex);
4555 			fcip_rt_update(fptr, port_map, listlen);
4556 			mutex_enter(&fptr->fcip_mutex);
4557 		}
4558 		if (listlen > alloclen) {
4559 			alloclen = listlen;
4560 		}
4561 		kmem_free(port_map, (alloclen * sizeof (fc_portmap_t)));
4562 		/*
4563 		 * Now fall through and register with the transport
4564 		 * that this port is IP capable
4565 		 */
4566 	}
4567 	/* FALLTHROUGH */
4568 	case FC_TOP_NO_NS:
4569 		/*
4570 		 * If we don't have a nameserver, lets wait until we
4571 		 * have to send out a packet to a remote port and then
4572 		 * try and discover the port using ARP/FARP.
4573 		 */
4574 	/* FALLTHROUGH */
4575 	case FC_TOP_PUBLIC_LOOP:
4576 	case FC_TOP_FABRIC: {
4577 		fc_portmap_t	*port_map;
4578 		uint32_t	listlen, alloclen;
4579 
4580 		/* FC_TYPE of 0x05 goes to word 0, LSB */
4581 		fptr->fcip_port_state = FCIP_PORT_ONLINE;
4582 
4583 		if (!(fptr->fcip_flags & FCIP_REG_INPROGRESS)) {
4584 			fptr->fcip_flags |= FCIP_REG_INPROGRESS;
4585 			if (taskq_dispatch(fptr->fcip_tq, fcip_port_ns,
4586 			    fptr, KM_NOSLEEP) == 0) {
4587 				fptr->fcip_flags &= ~FCIP_REG_INPROGRESS;
4588 			}
4589 		}
4590 
4591 		/*
4592 		 * If fcip_create_nodes_on_demand is overridden to force
4593 		 * discovery of all nodes in Fabric/Public loop topologies
4594 		 * we need to query for and obtain all nodes and log into
4595 		 * them as with private loop devices
4596 		 */
4597 		if (!fcip_create_nodes_on_demand) {
4598 			fptr->fcip_port_state = FCIP_PORT_ONLINE;
4599 			listlen = alloclen = FCIP_MAX_PORTS;
4600 			port_map = (fc_portmap_t *)
4601 			    kmem_zalloc((FCIP_MAX_PORTS *
4602 			    sizeof (fc_portmap_t)), KM_SLEEP);
4603 			if (fc_ulp_getportmap(fport->fcipp_handle, &port_map,
4604 			    &listlen, FC_ULP_PLOGI_PRESERVE) == FC_SUCCESS) {
4605 				mutex_exit(&fptr->fcip_mutex);
4606 				fcip_rt_update(fptr, port_map, listlen);
4607 				mutex_enter(&fptr->fcip_mutex);
4608 			}
4609 			if (listlen > alloclen) {
4610 				alloclen = listlen;
4611 			}
4612 			kmem_free(port_map,
4613 			    (alloclen * sizeof (fc_portmap_t)));
4614 		}
4615 		break;
4616 	}
4617 
4618 	default:
4619 		break;
4620 	}
4621 }
4622 
4623 static void
4624 fcip_port_ns(void *arg)
4625 {
4626 	struct	fcip		*fptr = (struct fcip *)arg;
4627 	fcip_port_info_t	*fport = fptr->fcip_port_info;
4628 	fc_ns_cmd_t		ns_cmd;
4629 	uint32_t		types[8];
4630 	ns_rfc_type_t		rfc;
4631 
4632 	mutex_enter(&fptr->fcip_mutex);
4633 	if ((fptr->fcip_flags & (FCIP_DETACHING | FCIP_DETACHED)) ||
4634 	    (fptr->fcip_flags & (FCIP_SUSPENDED | FCIP_POWER_DOWN))) {
4635 		fptr->fcip_flags &= ~FCIP_REG_INPROGRESS;
4636 		mutex_exit(&fptr->fcip_mutex);
4637 		return;
4638 	}
4639 	mutex_exit(&fptr->fcip_mutex);
4640 
4641 	/*
4642 	 * Prepare the Name server structure to
4643 	 * register with the transport in case of
4644 	 * Fabric configuration.
4645 	 */
4646 	bzero(&rfc, sizeof (rfc));
4647 	bzero(types, sizeof (types));
4648 
4649 	types[FC4_TYPE_WORD_POS(FC_TYPE_IS8802_SNAP)] = (1 <<
4650 	    FC4_TYPE_BIT_POS(FC_TYPE_IS8802_SNAP));
4651 
4652 	rfc.rfc_port_id.port_id = fport->fcipp_sid.port_id;
4653 	bcopy(types, rfc.rfc_types, sizeof (types));
4654 
4655 	ns_cmd.ns_flags = 0;
4656 	ns_cmd.ns_cmd = NS_RFT_ID;
4657 	ns_cmd.ns_req_len = sizeof (rfc);
4658 	ns_cmd.ns_req_payload = (caddr_t)&rfc;
4659 	ns_cmd.ns_resp_len = 0;
4660 	ns_cmd.ns_resp_payload = NULL;
4661 
4662 	/*
4663 	 * Perform the Name Server Registration for FC IS8802_SNAP Type.
4664 	 * We don't expect a reply for registering port type
4665 	 */
4666 	(void) fc_ulp_port_ns(fptr->fcip_port_info->fcipp_handle,
4667 		(opaque_t)0, &ns_cmd);
4668 
4669 	mutex_enter(&fptr->fcip_mutex);
4670 	fptr->fcip_flags &= ~FCIP_REG_INPROGRESS;
4671 	mutex_exit(&fptr->fcip_mutex);
4672 }
4673 
4674 /*
4675  * setup this instance of fcip. This routine inits kstats, allocates
4676  * unsolicited buffers, determines' this port's siblings and handles
4677  * topology specific details which includes registering with the name
4678  * server and also setting up the routing table for this port for
4679  * private loops and point to point topologies
4680  */
4681 static int
4682 fcip_init_port(struct fcip *fptr)
4683 {
4684 	int rval = FC_SUCCESS;
4685 	fcip_port_info_t	*fport = fptr->fcip_port_info;
4686 	static char buf[64];
4687 	size_t	tok_buf_size = 0;
4688 
4689 	ASSERT(fport != NULL);
4690 
4691 	FCIP_TNF_PROBE_1((fcip_init_port, "fcip io", /* CSTYLED */,
4692 		tnf_string, msg, "enter"));
4693 	mutex_enter(&fptr->fcip_mutex);
4694 
4695 	/*
4696 	 * setup mac address for this port. Don't be too worried if
4697 	 * the WWN is zero, there is probably nothing attached to
4698 	 * to the port. There is no point allocating unsolicited buffers
4699 	 * for an unused port so return success if we don't have a MAC
4700 	 * address. Do the port init on a state change notification.
4701 	 */
4702 	if (fcip_setup_mac_addr(fptr) == FCIP_INVALID_WWN) {
4703 		fptr->fcip_port_state = FCIP_PORT_OFFLINE;
4704 		rval = FC_SUCCESS;
4705 		goto done;
4706 	}
4707 
4708 	/*
4709 	 * clear routing table hash list for this port
4710 	 */
4711 	fcip_rt_flush(fptr);
4712 
4713 	/*
4714 	 * init kstats for this instance
4715 	 */
4716 	fcip_kstat_init(fptr);
4717 
4718 	/*
4719 	 * Allocate unsolicited buffers
4720 	 */
4721 	fptr->fcip_ub_nbufs = fcip_ub_nbufs;
4722 	tok_buf_size = sizeof (*fptr->fcip_ub_tokens) * fcip_ub_nbufs;
4723 
4724 	FCIP_TNF_PROBE_2((fcip_init_port, "fcip io", /* CSTYLED */,
4725 		tnf_string, msg, "debug",
4726 		tnf_int, tokBufsize, tok_buf_size));
4727 
4728 	FCIP_DEBUG(FCIP_DEBUG_INIT,
4729 	    (CE_WARN, "tokBufsize: 0x%lx", tok_buf_size));
4730 
4731 	fptr->fcip_ub_tokens = kmem_zalloc(tok_buf_size, KM_SLEEP);
4732 
4733 	if (fptr->fcip_ub_tokens == NULL) {
4734 		rval = FC_FAILURE;
4735 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4736 		    (CE_WARN, "fcip(%d): failed to allocate unsol buf",
4737 		    fptr->fcip_instance));
4738 		goto done;
4739 	}
4740 	rval = fc_ulp_uballoc(fport->fcipp_handle, &fptr->fcip_ub_nbufs,
4741 		fcip_ub_size, FC_TYPE_IS8802_SNAP, fptr->fcip_ub_tokens);
4742 
4743 	if (rval != FC_SUCCESS) {
4744 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4745 		    (CE_WARN, "fcip(%d): fc_ulp_uballoc failed with 0x%x!!",
4746 		    fptr->fcip_instance, rval));
4747 	}
4748 
4749 	switch (rval) {
4750 	case FC_SUCCESS:
4751 		break;
4752 
4753 	case FC_OFFLINE:
4754 		fptr->fcip_port_state = FCIP_PORT_OFFLINE;
4755 		rval = FC_FAILURE;
4756 		goto done;
4757 
4758 	case FC_UB_ERROR:
4759 		FCIP_TNF_PROBE_1((fcip_init_port, "fcip io", /* CSTYLED */,
4760 			tnf_string, msg, "invalid ub alloc request"));
4761 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4762 		    (CE_WARN, "invalid ub alloc request !!"));
4763 		rval = FC_FAILURE;
4764 		goto done;
4765 
4766 	case FC_FAILURE:
4767 		/*
4768 		 * requested bytes could not be alloced
4769 		 */
4770 		if (fptr->fcip_ub_nbufs != fcip_ub_nbufs) {
4771 			cmn_err(CE_WARN,
4772 			    "!fcip(0x%x): Failed to alloc unsolicited bufs",
4773 			    ddi_get_instance(fport->fcipp_dip));
4774 			rval = FC_FAILURE;
4775 			goto done;
4776 		}
4777 		break;
4778 
4779 	default:
4780 		rval = FC_FAILURE;
4781 		break;
4782 	}
4783 
4784 	/*
4785 	 * Preallocate a Cache of fcip packets for transmit and receive
4786 	 * We don't want to be holding on to unsolicited buffers while
4787 	 * we transmit the message upstream
4788 	 */
4789 	FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_NOTE, "allocating fcip_pkt cache"));
4790 
4791 	(void) sprintf(buf, "fcip%d_cache", fptr->fcip_instance);
4792 	fptr->fcip_xmit_cache = kmem_cache_create(buf,
4793 		(fport->fcipp_fca_pkt_size + sizeof (fcip_pkt_t)),
4794 		8, fcip_cache_constructor, fcip_cache_destructor,
4795 		NULL, (void *)fport, NULL, 0);
4796 
4797 	(void) sprintf(buf, "fcip%d_sendup_cache", fptr->fcip_instance);
4798 	fptr->fcip_sendup_cache = kmem_cache_create(buf,
4799 		sizeof (struct fcip_sendup_elem),
4800 		8, fcip_sendup_constructor, NULL, NULL, (void *)fport, NULL, 0);
4801 
4802 	if (fptr->fcip_xmit_cache == NULL) {
4803 		FCIP_TNF_PROBE_2((fcip_init_port, "fcip io", /* CSTYLED */,
4804 			tnf_string, msg, "unable to allocate xmit cache",
4805 			tnf_int, instance, fptr->fcip_instance));
4806 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4807 		    (CE_WARN, "fcip%d unable to allocate xmit cache",
4808 		    fptr->fcip_instance));
4809 		rval = FC_FAILURE;
4810 		goto done;
4811 	}
4812 
4813 	/*
4814 	 * We may need to handle routing tables for point to point and
4815 	 * fcal topologies and register with NameServer for Fabric
4816 	 * topologies.
4817 	 */
4818 	fcip_handle_topology(fptr);
4819 	mutex_exit(&fptr->fcip_mutex);
4820 	if (fcip_dest_add_broadcast_entry(fptr, 1) != FC_SUCCESS) {
4821 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4822 		    (CE_WARN, "fcip(0x%x):add broadcast entry failed!!",
4823 		    fptr->fcip_instance));
4824 		mutex_enter(&fptr->fcip_mutex);
4825 		rval = FC_FAILURE;
4826 		goto done;
4827 	}
4828 
4829 	rval = FC_SUCCESS;
4830 	return (rval);
4831 
4832 done:
4833 	/*
4834 	 * we don't always come here from port_attach - so cleanup
4835 	 * anything done in the init_port routine
4836 	 */
4837 	if (fptr->fcip_kstatp) {
4838 		kstat_delete(fptr->fcip_kstatp);
4839 		fptr->fcip_kstatp = NULL;
4840 	}
4841 
4842 	if (fptr->fcip_xmit_cache) {
4843 		kmem_cache_destroy(fptr->fcip_xmit_cache);
4844 		fptr->fcip_xmit_cache = NULL;
4845 	}
4846 
4847 	if (fptr->fcip_sendup_cache) {
4848 		kmem_cache_destroy(fptr->fcip_sendup_cache);
4849 		fptr->fcip_sendup_cache = NULL;
4850 	}
4851 
4852 	/* release unsolicited buffers */
4853 	if (fptr->fcip_ub_tokens) {
4854 		uint64_t	*tokens = fptr->fcip_ub_tokens;
4855 		fptr->fcip_ub_tokens = NULL;
4856 
4857 		mutex_exit(&fptr->fcip_mutex);
4858 		(void) fc_ulp_ubfree(fport->fcipp_handle, fptr->fcip_ub_nbufs,
4859 			tokens);
4860 		kmem_free(tokens, tok_buf_size);
4861 
4862 	} else {
4863 		mutex_exit(&fptr->fcip_mutex);
4864 	}
4865 
4866 	return (rval);
4867 }
4868 
4869 /*
4870  * Sets up a port's MAC address from its WWN
4871  */
4872 static int
4873 fcip_setup_mac_addr(struct fcip *fptr)
4874 {
4875 	fcip_port_info_t	*fport = fptr->fcip_port_info;
4876 
4877 	ASSERT(mutex_owned(&fptr->fcip_mutex));
4878 
4879 	fptr->fcip_addrflags = 0;
4880 
4881 	/*
4882 	 * we cannot choose a MAC address for our interface - we have
4883 	 * to live with whatever node WWN we get (minus the top two
4884 	 * MSbytes for the MAC address) from the transport layer. We will
4885 	 * treat the WWN as our factory MAC address.
4886 	 */
4887 
4888 	if ((fport->fcipp_nwwn.w.wwn_hi != 0) ||
4889 	    (fport->fcipp_nwwn.w.wwn_lo != 0)) {
4890 		char		etherstr[ETHERSTRL];
4891 
4892 		wwn_to_ether(&fport->fcipp_nwwn, &fptr->fcip_macaddr);
4893 		fcip_ether_to_str(&fptr->fcip_macaddr, etherstr);
4894 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4895 		    (CE_NOTE, "setupmacaddr ouraddr %s", etherstr));
4896 
4897 		fptr->fcip_addrflags = (FCIP_FACTADDR_PRESENT |
4898 						FCIP_FACTADDR_USE);
4899 	} else {
4900 		/*
4901 		 * No WWN - just return failure - there's not much
4902 		 * we can do since we cannot set the WWN.
4903 		 */
4904 		FCIP_DEBUG(FCIP_DEBUG_INIT,
4905 		    (CE_WARN, "Port does not have a valid WWN"));
4906 		return (FCIP_INVALID_WWN);
4907 	}
4908 	return (FC_SUCCESS);
4909 }
4910 
4911 
4912 /*
4913  * flush routing table entries
4914  */
4915 static void
4916 fcip_rt_flush(struct fcip *fptr)
4917 {
4918 	int index;
4919 
4920 	mutex_enter(&fptr->fcip_rt_mutex);
4921 	for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
4922 		struct fcip_routing_table 	*frtp, *frtp_next;
4923 		frtp = fptr->fcip_rtable[index];
4924 		while (frtp) {
4925 			frtp_next = frtp->fcipr_next;
4926 			kmem_free(frtp, sizeof (struct fcip_routing_table));
4927 			frtp = frtp_next;
4928 		}
4929 		fptr->fcip_rtable[index] = NULL;
4930 	}
4931 	mutex_exit(&fptr->fcip_rt_mutex);
4932 }
4933 
4934 /*
4935  * Free up the fcip softstate and all allocated resources for the
4936  * fcip instance assoicated with a given port driver instance
4937  *
4938  * Given that the list of structures pointed to by fcip_port_head,
4939  * this function is called from multiple sources, and the
4940  * fcip_global_mutex that protects fcip_port_head must be dropped,
4941  * our best solution is to return a value that indicates the next
4942  * port in the list.  This way the caller doesn't need to worry
4943  * about the race condition where it saves off a pointer to the
4944  * next structure in the list and by the time this routine returns,
4945  * that next structure has already been freed.
4946  */
4947 static fcip_port_info_t *
4948 fcip_softstate_free(fcip_port_info_t *fport)
4949 {
4950 	struct fcip		*fptr = NULL;
4951 	int 			instance;
4952 	timeout_id_t		tid;
4953 	opaque_t		phandle = NULL;
4954 	fcip_port_info_t	*prev_fport, *cur_fport, *next_fport = NULL;
4955 
4956 	ASSERT(MUTEX_HELD(&fcip_global_mutex));
4957 
4958 	if (fport) {
4959 		phandle = fport->fcipp_handle;
4960 		fptr = fport->fcipp_fcip;
4961 	} else {
4962 		return (next_fport);
4963 	}
4964 
4965 	if (fptr) {
4966 		mutex_enter(&fptr->fcip_mutex);
4967 		instance = ddi_get_instance(fptr->fcip_dip);
4968 
4969 		/*
4970 		 * dismantle timeout thread for this instance of fcip
4971 		 */
4972 		tid = fptr->fcip_timeout_id;
4973 		fptr->fcip_timeout_id = NULL;
4974 
4975 		mutex_exit(&fptr->fcip_mutex);
4976 		(void) untimeout(tid);
4977 		mutex_enter(&fptr->fcip_mutex);
4978 
4979 		ASSERT(fcip_num_instances >= 0);
4980 		fcip_num_instances--;
4981 
4982 		/*
4983 		 * stop sendup thread
4984 		 */
4985 		mutex_enter(&fptr->fcip_sendup_mutex);
4986 		if (fptr->fcip_sendup_thr_initted) {
4987 			fptr->fcip_sendup_thr_initted = 0;
4988 			cv_signal(&fptr->fcip_sendup_cv);
4989 			cv_wait(&fptr->fcip_sendup_cv,
4990 			    &fptr->fcip_sendup_mutex);
4991 		}
4992 		ASSERT(fptr->fcip_sendup_head == NULL);
4993 		fptr->fcip_sendup_head = fptr->fcip_sendup_tail = NULL;
4994 		mutex_exit(&fptr->fcip_sendup_mutex);
4995 
4996 		/*
4997 		 * dismantle taskq
4998 		 */
4999 		if (fptr->fcip_tq) {
5000 			taskq_t	*tq = fptr->fcip_tq;
5001 
5002 			fptr->fcip_tq = NULL;
5003 
5004 			mutex_exit(&fptr->fcip_mutex);
5005 			taskq_destroy(tq);
5006 			mutex_enter(&fptr->fcip_mutex);
5007 		}
5008 
5009 		if (fptr->fcip_kstatp) {
5010 			kstat_delete(fptr->fcip_kstatp);
5011 			fptr->fcip_kstatp = NULL;
5012 		}
5013 
5014 		/* flush the routing table entries */
5015 		fcip_rt_flush(fptr);
5016 
5017 		if (fptr->fcip_xmit_cache) {
5018 			kmem_cache_destroy(fptr->fcip_xmit_cache);
5019 			fptr->fcip_xmit_cache = NULL;
5020 		}
5021 
5022 		if (fptr->fcip_sendup_cache) {
5023 			kmem_cache_destroy(fptr->fcip_sendup_cache);
5024 			fptr->fcip_sendup_cache = NULL;
5025 		}
5026 
5027 		fcip_cleanup_dest(fptr);
5028 
5029 		/* release unsolicited buffers */
5030 		if (fptr->fcip_ub_tokens) {
5031 			uint64_t	*tokens = fptr->fcip_ub_tokens;
5032 
5033 			fptr->fcip_ub_tokens = NULL;
5034 			mutex_exit(&fptr->fcip_mutex);
5035 			if (phandle) {
5036 				/*
5037 				 * release the global mutex here to
5038 				 * permit any data pending callbacks to
5039 				 * complete. Else we will deadlock in the
5040 				 * FCA waiting for all unsol buffers to be
5041 				 * returned.
5042 				 */
5043 				mutex_exit(&fcip_global_mutex);
5044 				(void) fc_ulp_ubfree(phandle,
5045 				    fptr->fcip_ub_nbufs, tokens);
5046 				mutex_enter(&fcip_global_mutex);
5047 			}
5048 			kmem_free(tokens, (sizeof (*tokens) * fcip_ub_nbufs));
5049 		} else {
5050 			mutex_exit(&fptr->fcip_mutex);
5051 		}
5052 
5053 		mutex_destroy(&fptr->fcip_mutex);
5054 		mutex_destroy(&fptr->fcip_ub_mutex);
5055 		mutex_destroy(&fptr->fcip_rt_mutex);
5056 		mutex_destroy(&fptr->fcip_dest_mutex);
5057 		mutex_destroy(&fptr->fcip_sendup_mutex);
5058 		cv_destroy(&fptr->fcip_farp_cv);
5059 		cv_destroy(&fptr->fcip_sendup_cv);
5060 		cv_destroy(&fptr->fcip_ub_cv);
5061 
5062 		ddi_soft_state_free(fcip_softp, instance);
5063 	}
5064 
5065 	/*
5066 	 * Now dequeue the fcip_port_info from the port list
5067 	 */
5068 	cur_fport = fcip_port_head;
5069 	prev_fport = NULL;
5070 	while (cur_fport != NULL) {
5071 		if (cur_fport == fport) {
5072 			break;
5073 		}
5074 		prev_fport = cur_fport;
5075 		cur_fport = cur_fport->fcipp_next;
5076 	}
5077 
5078 	/*
5079 	 * Assert that we found a port in our port list
5080 	 */
5081 	ASSERT(cur_fport == fport);
5082 
5083 	if (prev_fport) {
5084 		/*
5085 		 * Not the first port in the port list
5086 		 */
5087 		prev_fport->fcipp_next = fport->fcipp_next;
5088 	} else {
5089 		/*
5090 		 * first port
5091 		 */
5092 		fcip_port_head = fport->fcipp_next;
5093 	}
5094 	next_fport = fport->fcipp_next;
5095 	kmem_free(fport, sizeof (fcip_port_info_t));
5096 
5097 	return (next_fport);
5098 }
5099 
5100 
5101 /*
5102  * This is called by transport for any ioctl operations performed
5103  * on the devctl or other transport minor nodes. It is currently
5104  * unused for fcip
5105  */
5106 /* ARGSUSED */
5107 static int
5108 fcip_port_ioctl(opaque_t ulp_handle,  opaque_t port_handle, dev_t dev,
5109 	int cmd, intptr_t data, int mode, cred_t *credp, int *rval,
5110 	uint32_t claimed)
5111 {
5112 	return (FC_UNCLAIMED);
5113 }
5114 
5115 /*
5116  * DL_INFO_REQ - returns information about the DLPI stream to the DLS user
5117  * requesting information about this interface
5118  */
5119 static void
5120 fcip_ireq(queue_t *wq, mblk_t *mp)
5121 {
5122 	struct fcipstr		*slp;
5123 	struct fcip		*fptr;
5124 	dl_info_ack_t		*dlip;
5125 	struct fcipdladdr	*dlap;
5126 	la_wwn_t		*ep;
5127 	int 			size;
5128 	char			etherstr[ETHERSTRL];
5129 
5130 	slp = (struct fcipstr *)wq->q_ptr;
5131 
5132 	fptr = slp->sl_fcip;
5133 
5134 	FCIP_DEBUG(FCIP_DEBUG_DLPI,
5135 	    (CE_NOTE, "fcip_ireq: info request req rcvd"));
5136 
5137 	FCIP_TNF_PROBE_1((fcip_ireq, "fcip io", /* CSTYLED */,
5138 	    tnf_string, msg, "fcip ireq entered"));
5139 
5140 	if (MBLKL(mp) < DL_INFO_REQ_SIZE) {
5141 		dlerrorack(wq, mp, DL_INFO_REQ, DL_BADPRIM, 0);
5142 		return;
5143 	}
5144 
5145 	/*
5146 	 * Exchange current message for a DL_INFO_ACK
5147 	 */
5148 	size = sizeof (dl_info_ack_t) + FCIPADDRL + ETHERADDRL;
5149 	if ((mp = mexchange(wq, mp, size, M_PCPROTO, DL_INFO_ACK)) == NULL) {
5150 		return;
5151 	}
5152 
5153 	/*
5154 	 * FILL in the DL_INFO_ACK fields and reply
5155 	 */
5156 	dlip = (dl_info_ack_t *)mp->b_rptr;
5157 	*dlip = fcip_infoack;
5158 	dlip->dl_current_state = slp->sl_state;
5159 	dlap = (struct fcipdladdr *)(mp->b_rptr + dlip->dl_addr_offset);
5160 	dlap->dl_sap = slp->sl_sap;
5161 
5162 
5163 	if (fptr) {
5164 		fcip_ether_to_str(&fptr->fcip_macaddr, etherstr);
5165 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5166 		    (CE_NOTE, "ireq - our mac: %s", etherstr));
5167 		ether_bcopy(&fptr->fcip_macaddr, &dlap->dl_phys);
5168 	} else {
5169 		bzero((caddr_t)&dlap->dl_phys, ETHERADDRL);
5170 	}
5171 
5172 	ep = (la_wwn_t *)(mp->b_rptr + dlip->dl_brdcst_addr_offset);
5173 	ether_bcopy(&fcip_arpbroadcast_addr, ep);
5174 
5175 	FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "sending back info req.."));
5176 	qreply(wq, mp);
5177 }
5178 
5179 
5180 /*
5181  * To handle DL_UNITDATA_REQ requests.
5182  */
5183 
5184 static void
5185 fcip_udreq(queue_t *wq, mblk_t *mp)
5186 {
5187 	struct fcipstr		*slp;
5188 	struct fcip		*fptr;
5189 	fcip_port_info_t	*fport;
5190 	dl_unitdata_req_t	*dludp;
5191 	mblk_t			*nmp;
5192 	struct fcipdladdr	*dlap;
5193 	fcph_network_hdr_t 	*headerp;
5194 	llc_snap_hdr_t		*lsnap;
5195 	t_uscalar_t		off, len;
5196 	struct fcip_dest	*fdestp;
5197 	la_wwn_t		wwn;
5198 	int			hdr_size;
5199 
5200 	FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "inside fcip_udreq"));
5201 
5202 	FCIP_TNF_PROBE_1((fcip_udreq, "fcip io", /* CSTYLED */,
5203 	    tnf_string, msg, "fcip udreq entered"));
5204 
5205 	slp = (struct fcipstr *)wq->q_ptr;
5206 
5207 	if (slp->sl_state != DL_IDLE) {
5208 		dlerrorack(wq, mp, DL_UNITDATA_REQ, DL_OUTSTATE, 0);
5209 		return;
5210 	}
5211 
5212 	fptr = slp->sl_fcip;
5213 
5214 	if (fptr == NULL) {
5215 		dlerrorack(wq, mp, DL_UNITDATA_REQ, DL_OUTSTATE, 0);
5216 		return;
5217 	}
5218 
5219 	fport = fptr->fcip_port_info;
5220 
5221 	dludp = (dl_unitdata_req_t *)mp->b_rptr;
5222 	off = dludp->dl_dest_addr_offset;
5223 	len = dludp->dl_dest_addr_length;
5224 
5225 	/*
5226 	 * Validate destination address format
5227 	 */
5228 	if (!MBLKIN(mp, off, len) || (len != FCIPADDRL)) {
5229 		dluderrorind(wq, mp, (mp->b_rptr + off), len, DL_BADADDR, 0);
5230 		return;
5231 	}
5232 
5233 	/*
5234 	 * Error if no M_DATA follows
5235 	 */
5236 	nmp = mp->b_cont;
5237 	if (nmp == NULL) {
5238 		dluderrorind(wq, mp, (mp->b_rptr + off), len, DL_BADDATA, 0);
5239 		return;
5240 	}
5241 	dlap = (struct fcipdladdr *)(mp->b_rptr + off);
5242 
5243 	/*
5244 	 * Now get the destination structure for the remote NPORT
5245 	 */
5246 	ether_to_wwn(&dlap->dl_phys, &wwn);
5247 	fdestp = fcip_get_dest(fptr, &wwn);
5248 
5249 	if (fdestp == NULL) {
5250 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE,
5251 		    "udreq - couldn't find dest struct for remote port"));
5252 		dluderrorind(wq, mp, (mp->b_rptr + off), len, DL_BADDATA, 0);
5253 		return;
5254 	}
5255 
5256 	/*
5257 	 * Network header + SAP
5258 	 */
5259 	hdr_size = sizeof (fcph_network_hdr_t) + sizeof (llc_snap_hdr_t);
5260 
5261 	/* DB_REF gives the no. of msgs pointing to this block */
5262 	if ((DB_REF(nmp) == 1) &&
5263 	    (MBLKHEAD(nmp) >= hdr_size) &&
5264 	    (((uintptr_t)mp->b_rptr & 0x1) == 0)) {
5265 		la_wwn_t wwn;
5266 		nmp->b_rptr -= hdr_size;
5267 
5268 		/* first put the network header */
5269 		headerp = (fcph_network_hdr_t *)nmp->b_rptr;
5270 		if (ether_cmp(&dlap->dl_phys, &fcip_arpbroadcast_addr) == 0) {
5271 			ether_to_wwn(&fcipnhbroadcastaddr, &wwn);
5272 		} else {
5273 			ether_to_wwn(&dlap->dl_phys, &wwn);
5274 		}
5275 		bcopy(&wwn, &headerp->net_dest_addr, sizeof (la_wwn_t));
5276 		ether_to_wwn(&fptr->fcip_macaddr, &wwn);
5277 		bcopy(&wwn, &headerp->net_src_addr, sizeof (la_wwn_t));
5278 
5279 		/* Now the snap header */
5280 		lsnap = (llc_snap_hdr_t *)(nmp->b_rptr +
5281 		    sizeof (fcph_network_hdr_t));
5282 		lsnap->dsap = 0xAA;
5283 		lsnap->ssap = 0xAA;
5284 		lsnap->ctrl = 0x03;
5285 		lsnap->oui[0] = 0x00;
5286 		lsnap->oui[1] = 0x00; 	/* 80 */
5287 		lsnap->oui[2] = 0x00;	/* C2 */
5288 		lsnap->pid = BE_16((dlap->dl_sap));
5289 
5290 		freeb(mp);
5291 		mp = nmp;
5292 
5293 	} else {
5294 		la_wwn_t wwn;
5295 
5296 		DB_TYPE(mp) = M_DATA;
5297 		headerp = (fcph_network_hdr_t *)mp->b_rptr;
5298 
5299 		/*
5300 		 * Only fill in the low 48bits of WWN for now - we can
5301 		 * fill in the NAA_ID after we find the port in the
5302 		 * routing tables
5303 		 */
5304 		if (ether_cmp(&dlap->dl_phys, &fcip_arpbroadcast_addr) == 0) {
5305 			ether_to_wwn(&fcipnhbroadcastaddr, &wwn);
5306 		} else {
5307 			ether_to_wwn(&dlap->dl_phys, &wwn);
5308 		}
5309 		bcopy(&wwn, &headerp->net_dest_addr, sizeof (la_wwn_t));
5310 		/* need to send our PWWN */
5311 		bcopy(&fport->fcipp_pwwn, &headerp->net_src_addr,
5312 		    sizeof (la_wwn_t));
5313 
5314 		lsnap = (llc_snap_hdr_t *)(nmp->b_rptr +
5315 		    sizeof (fcph_network_hdr_t));
5316 		lsnap->dsap = 0xAA;
5317 		lsnap->ssap = 0xAA;
5318 		lsnap->ctrl = 0x03;
5319 		lsnap->oui[0] = 0x00;
5320 		lsnap->oui[1] = 0x00;
5321 		lsnap->oui[2] = 0x00;
5322 		lsnap->pid = BE_16(dlap->dl_sap);
5323 
5324 		mp->b_wptr = mp->b_rptr + hdr_size;
5325 	}
5326 
5327 	/*
5328 	 * Ethernet drivers have a lot of gunk here to put the Type
5329 	 * information (for Ethernet encapsulation (RFC 894) or the
5330 	 * Length (for 802.2/802.3) - I guess we'll just ignore that
5331 	 * here.
5332 	 */
5333 
5334 	/*
5335 	 * Start the I/O on this port. If fcip_start failed for some reason
5336 	 * we call putbq in fcip_start so we don't need to check the
5337 	 * return value from fcip_start
5338 	 */
5339 	(void) fcip_start(wq, mp, fptr, fdestp, KM_SLEEP);
5340 }
5341 
5342 /*
5343  * DL_ATTACH_REQ: attaches a PPA with a stream. ATTACH requets are needed
5344  * for style 2 DLS providers to identify the physical medium through which
5345  * the streams communication will happen
5346  */
5347 static void
5348 fcip_areq(queue_t *wq, mblk_t *mp)
5349 {
5350 	struct fcipstr		*slp;
5351 	union DL_primitives	*dlp;
5352 	fcip_port_info_t	*fport;
5353 	struct fcip		*fptr;
5354 	int			ppa;
5355 
5356 	slp = (struct fcipstr *)wq->q_ptr;
5357 	dlp = (union DL_primitives *)mp->b_rptr;
5358 
5359 	if (MBLKL(mp) < DL_ATTACH_REQ_SIZE) {
5360 		dlerrorack(wq, mp, DL_ATTACH_REQ, DL_BADPRIM, 0);
5361 		return;
5362 	}
5363 
5364 	if (slp->sl_state != DL_UNATTACHED) {
5365 		dlerrorack(wq, mp, DL_ATTACH_REQ, DL_OUTSTATE, 0);
5366 		return;
5367 	}
5368 
5369 	ppa = dlp->attach_req.dl_ppa;
5370 	FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "attach req: ppa %x", ppa));
5371 
5372 	/*
5373 	 * check if the PPA is valid
5374 	 */
5375 
5376 	mutex_enter(&fcip_global_mutex);
5377 
5378 	for (fport = fcip_port_head; fport; fport = fport->fcipp_next) {
5379 		if ((fptr = fport->fcipp_fcip) == NULL) {
5380 			continue;
5381 		}
5382 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "ppa %x, inst %x", ppa,
5383 		    ddi_get_instance(fptr->fcip_dip)));
5384 
5385 		if (ppa == ddi_get_instance(fptr->fcip_dip)) {
5386 			FCIP_DEBUG(FCIP_DEBUG_DLPI,
5387 			    (CE_NOTE, "ppa found %x", ppa));
5388 			break;
5389 		}
5390 	}
5391 
5392 	if (fport == NULL) {
5393 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5394 		    (CE_NOTE, "dlerrorack coz fport==NULL"));
5395 
5396 		mutex_exit(&fcip_global_mutex);
5397 
5398 		if (fc_ulp_get_port_handle(ppa) == NULL) {
5399 			dlerrorack(wq, mp, DL_ATTACH_REQ, DL_BADPPA, 0);
5400 			return;
5401 		}
5402 
5403 		/*
5404 		 * Wait for Port attach callback to trigger.  If port_detach
5405 		 * got in while we were waiting, then ddi_get_soft_state
5406 		 * will return NULL, and we'll return error.
5407 		 */
5408 
5409 		delay(drv_usectohz(FCIP_INIT_DELAY));
5410 		mutex_enter(&fcip_global_mutex);
5411 
5412 		fptr = ddi_get_soft_state(fcip_softp, ppa);
5413 		if (fptr == NULL) {
5414 			mutex_exit(&fcip_global_mutex);
5415 			dlerrorack(wq, mp, DL_ATTACH_REQ, DL_BADPPA, 0);
5416 			return;
5417 		}
5418 	}
5419 
5420 	/*
5421 	 * set link to device and update our state
5422 	 */
5423 	slp->sl_fcip = fptr;
5424 	slp->sl_state = DL_UNBOUND;
5425 
5426 	mutex_exit(&fcip_global_mutex);
5427 
5428 #ifdef DEBUG
5429 	mutex_enter(&fptr->fcip_mutex);
5430 	if (fptr->fcip_flags & FCIP_LINK_DOWN) {
5431 		FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_WARN, "port not online yet"));
5432 	}
5433 	mutex_exit(&fptr->fcip_mutex);
5434 #endif
5435 
5436 	dlokack(wq, mp, DL_ATTACH_REQ);
5437 }
5438 
5439 
5440 /*
5441  * DL_DETACH request - detaches a PPA from a stream
5442  */
5443 static void
5444 fcip_dreq(queue_t *wq, mblk_t *mp)
5445 {
5446 	struct fcipstr		*slp;
5447 
5448 	slp = (struct fcipstr *)wq->q_ptr;
5449 
5450 	if (MBLKL(mp) < DL_DETACH_REQ_SIZE) {
5451 		dlerrorack(wq, mp, DL_DETACH_REQ, DL_BADPRIM, 0);
5452 		return;
5453 	}
5454 
5455 	if (slp->sl_state != DL_UNBOUND) {
5456 		dlerrorack(wq, mp, DL_DETACH_REQ, DL_OUTSTATE, 0);
5457 		return;
5458 	}
5459 
5460 	fcip_dodetach(slp);
5461 	dlokack(wq, mp, DL_DETACH_REQ);
5462 }
5463 
5464 /*
5465  * DL_BIND request: requests a DLS provider to bind a DLSAP to the stream.
5466  * DLS users communicate with a physical interface through DLSAPs. Multiple
5467  * DLSAPs can be bound to the same stream (PPA)
5468  */
5469 static void
5470 fcip_breq(queue_t *wq, mblk_t *mp)
5471 {
5472 	struct fcipstr		*slp;
5473 	union DL_primitives	*dlp;
5474 	struct fcip		*fptr;
5475 	struct fcipdladdr	fcipaddr;
5476 	t_uscalar_t		sap;
5477 	int			xidtest;
5478 
5479 	slp = (struct fcipstr *)wq->q_ptr;
5480 
5481 	if (MBLKL(mp) < DL_BIND_REQ_SIZE) {
5482 		dlerrorack(wq, mp, DL_BIND_REQ, DL_BADPRIM, 0);
5483 		return;
5484 	}
5485 
5486 	if (slp->sl_state != DL_UNBOUND) {
5487 		dlerrorack(wq, mp, DL_BIND_REQ, DL_OUTSTATE, 0);
5488 		return;
5489 	}
5490 
5491 	dlp = (union DL_primitives *)mp->b_rptr;
5492 	fptr = slp->sl_fcip;
5493 
5494 	if (fptr == NULL) {
5495 		dlerrorack(wq, mp, DL_BIND_REQ, DL_OUTSTATE, 0);
5496 		return;
5497 	}
5498 
5499 	sap = dlp->bind_req.dl_sap;
5500 	FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "fcip_breq - sap: %x", sap));
5501 	xidtest = dlp->bind_req.dl_xidtest_flg;
5502 
5503 	if (xidtest) {
5504 		dlerrorack(wq, mp, DL_BIND_REQ, DL_NOAUTO, 0);
5505 		return;
5506 	}
5507 
5508 	FCIP_DEBUG(FCIP_DEBUG_DLPI, (CE_NOTE, "DLBIND: sap : %x", sap));
5509 
5510 	if (sap > ETHERTYPE_MAX) {
5511 		dlerrorack(wq, mp, dlp->dl_primitive, DL_BADSAP, 0);
5512 		return;
5513 	}
5514 	/*
5515 	 * save SAP for this stream and change the link state
5516 	 */
5517 	slp->sl_sap = sap;
5518 	slp->sl_state = DL_IDLE;
5519 
5520 	fcipaddr.dl_sap = sap;
5521 	ether_bcopy(&fptr->fcip_macaddr, &fcipaddr.dl_phys);
5522 	dlbindack(wq, mp, sap, &fcipaddr, FCIPADDRL, 0, 0);
5523 
5524 	fcip_setipq(fptr);
5525 }
5526 
5527 /*
5528  * DL_UNBIND request to unbind a previously bound DLSAP, from this stream
5529  */
5530 static void
5531 fcip_ubreq(queue_t *wq, mblk_t *mp)
5532 {
5533 	struct fcipstr	*slp;
5534 
5535 	slp = (struct fcipstr *)wq->q_ptr;
5536 
5537 	if (MBLKL(mp) < DL_UNBIND_REQ_SIZE) {
5538 		dlerrorack(wq, mp, DL_UNBIND_REQ, DL_BADPRIM, 0);
5539 		return;
5540 	}
5541 
5542 	if (slp->sl_state != DL_IDLE) {
5543 		dlerrorack(wq, mp, DL_UNBIND_REQ, DL_OUTSTATE, 0);
5544 		return;
5545 	}
5546 
5547 	slp->sl_state = DL_UNBOUND;
5548 	slp->sl_sap = 0;
5549 
5550 	(void) putnextctl1(RD(wq), M_FLUSH, FLUSHRW);
5551 	dlokack(wq, mp, DL_UNBIND_REQ);
5552 
5553 	fcip_setipq(slp->sl_fcip);
5554 }
5555 
5556 /*
5557  * Return our physical address
5558  */
5559 static void
5560 fcip_pareq(queue_t *wq, mblk_t *mp)
5561 {
5562 	struct fcipstr 		*slp;
5563 	union DL_primitives	*dlp;
5564 	int			type;
5565 	struct fcip		*fptr;
5566 	fcip_port_info_t	*fport;
5567 	struct ether_addr	addr;
5568 
5569 	slp = (struct fcipstr *)wq->q_ptr;
5570 
5571 	if (MBLKL(mp) < DL_PHYS_ADDR_REQ_SIZE) {
5572 		dlerrorack(wq, mp, DL_PHYS_ADDR_REQ, DL_BADPRIM, 0);
5573 		return;
5574 	}
5575 
5576 	dlp = (union DL_primitives *)mp->b_rptr;
5577 	type = dlp->physaddr_req.dl_addr_type;
5578 	fptr = slp->sl_fcip;
5579 
5580 	if (fptr == NULL) {
5581 		dlerrorack(wq, mp, DL_PHYS_ADDR_REQ, DL_OUTSTATE, 0);
5582 		return;
5583 	}
5584 
5585 	fport = fptr->fcip_port_info;
5586 
5587 	switch (type) {
5588 	case DL_FACT_PHYS_ADDR:
5589 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5590 		    (CE_NOTE, "returning factory phys addr"));
5591 		wwn_to_ether(&fport->fcipp_pwwn, &addr);
5592 		break;
5593 
5594 	case DL_CURR_PHYS_ADDR:
5595 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5596 		    (CE_NOTE, "returning current phys addr"));
5597 		ether_bcopy(&fptr->fcip_macaddr, &addr);
5598 		break;
5599 
5600 	default:
5601 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5602 		    (CE_NOTE, "Not known cmd type in phys addr"));
5603 		dlerrorack(wq, mp, DL_PHYS_ADDR_REQ, DL_NOTSUPPORTED, 0);
5604 		return;
5605 	}
5606 	dlphysaddrack(wq, mp, &addr, ETHERADDRL);
5607 }
5608 
5609 /*
5610  * Set physical address DLPI request
5611  */
5612 static void
5613 fcip_spareq(queue_t *wq, mblk_t *mp)
5614 {
5615 	struct fcipstr		*slp;
5616 	union DL_primitives	*dlp;
5617 	t_uscalar_t		off, len;
5618 	struct ether_addr	*addrp;
5619 	la_wwn_t		wwn;
5620 	struct fcip		*fptr;
5621 	fc_ns_cmd_t		fcip_ns_cmd;
5622 
5623 	slp = (struct fcipstr *)wq->q_ptr;
5624 
5625 	if (MBLKL(mp) < DL_SET_PHYS_ADDR_REQ_SIZE) {
5626 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_BADPRIM, 0);
5627 		return;
5628 	}
5629 
5630 	dlp = (union DL_primitives *)mp->b_rptr;
5631 	len = dlp->set_physaddr_req.dl_addr_length;
5632 	off = dlp->set_physaddr_req.dl_addr_offset;
5633 
5634 	if (!MBLKIN(mp, off, len)) {
5635 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_BADPRIM, 0);
5636 		return;
5637 	}
5638 
5639 	addrp = (struct ether_addr *)(mp->b_rptr + off);
5640 
5641 	/*
5642 	 * If the length of physical address is not correct or address
5643 	 * specified is a broadcast address or multicast addr -
5644 	 * return an error.
5645 	 */
5646 	if ((len != ETHERADDRL) ||
5647 	    ((addrp->ether_addr_octet[0] & 01) == 1) ||
5648 	    (ether_cmp(addrp, &fcip_arpbroadcast_addr) == 0)) {
5649 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_BADADDR, 0);
5650 		return;
5651 	}
5652 
5653 	/*
5654 	 * check if a stream is attached to this device. Else return an error
5655 	 */
5656 	if ((fptr = slp->sl_fcip) == NULL) {
5657 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_OUTSTATE, 0);
5658 		return;
5659 	}
5660 
5661 	/*
5662 	 * set the new interface local address. We request the transport
5663 	 * layer to change the Port WWN for this device - return an error
5664 	 * if we don't succeed.
5665 	 */
5666 
5667 	ether_to_wwn(addrp, &wwn);
5668 	if (fcip_set_wwn(&wwn) == FC_SUCCESS) {
5669 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5670 		    (CE_WARN, "WWN changed in spareq"));
5671 	} else {
5672 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_BADADDR, 0);
5673 	}
5674 
5675 	/*
5676 	 * register The new Port WWN and Node WWN with the transport
5677 	 * and Nameserver. Hope the transport ensures all current I/O
5678 	 * has stopped before actually attempting to register a new
5679 	 * port and Node WWN else we are hosed. Maybe a Link reset
5680 	 * will get everyone's attention.
5681 	 */
5682 	fcip_ns_cmd.ns_flags = 0;
5683 	fcip_ns_cmd.ns_cmd = NS_RPN_ID;
5684 	fcip_ns_cmd.ns_req_len = sizeof (la_wwn_t);
5685 	fcip_ns_cmd.ns_req_payload = (caddr_t)&wwn.raw_wwn[0];
5686 	fcip_ns_cmd.ns_resp_len = 0;
5687 	fcip_ns_cmd.ns_resp_payload = (caddr_t)0;
5688 	if (fc_ulp_port_ns(fptr->fcip_port_info->fcipp_handle,
5689 	    (opaque_t)0, &fcip_ns_cmd) != FC_SUCCESS) {
5690 		FCIP_DEBUG(FCIP_DEBUG_DLPI,
5691 		    (CE_WARN, "setting Port WWN failed"));
5692 		dlerrorack(wq, mp, DL_SET_PHYS_ADDR_REQ, DL_BADPRIM, 0);
5693 		return;
5694 	}
5695 
5696 	dlokack(wq, mp, DL_SET_PHYS_ADDR_REQ);
5697 }
5698 
5699 /*
5700  * change our port's WWN if permitted by hardware
5701  */
5702 /* ARGSUSED */
5703 static int
5704 fcip_set_wwn(la_wwn_t *pwwn)
5705 {
5706 	/*
5707 	 * We're usually not allowed to change the WWN of adapters
5708 	 * but some adapters do permit us to change the WWN - don't
5709 	 * permit setting of WWNs (yet?) - This behavior could be
5710 	 * modified if needed
5711 	 */
5712 	return (FC_FAILURE);
5713 }
5714 
5715 
5716 /*
5717  * This routine fills in the header for fastpath data requests. What this
5718  * does in simple terms is, instead of sending all data through the Unitdata
5719  * request dlpi code paths (which will then append the protocol specific
5720  * header - network and snap headers in our case), the upper layers issue
5721  * a M_IOCTL with a DL_IOC_HDR_INFO request and ask the streams endpoint
5722  * driver to give the header it needs appended and the upper layer
5723  * allocates and fills in the header and calls our put routine
5724  */
5725 static void
5726 fcip_dl_ioc_hdr_info(queue_t *wq, mblk_t *mp)
5727 {
5728 	mblk_t			*nmp;
5729 	struct fcipstr		*slp;
5730 	struct fcipdladdr	*dlap;
5731 	dl_unitdata_req_t	*dlup;
5732 	fcph_network_hdr_t	*headerp;
5733 	la_wwn_t		wwn;
5734 	llc_snap_hdr_t		*lsnap;
5735 	struct fcip		*fptr;
5736 	fcip_port_info_t	*fport;
5737 	t_uscalar_t		off, len;
5738 	size_t			hdrlen;
5739 	int 			error;
5740 
5741 	slp = (struct fcipstr *)wq->q_ptr;
5742 	fptr = slp->sl_fcip;
5743 	if (fptr == NULL) {
5744 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5745 		    (CE_NOTE, "dliochdr : returns EINVAL1"));
5746 		miocnak(wq, mp, 0, EINVAL);
5747 		return;
5748 	}
5749 
5750 	error = miocpullup(mp, sizeof (dl_unitdata_req_t) + FCIPADDRL);
5751 	if (error != 0) {
5752 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5753 		    (CE_NOTE, "dliochdr : returns %d", error));
5754 		miocnak(wq, mp, 0, error);
5755 		return;
5756 	}
5757 
5758 	fport = fptr->fcip_port_info;
5759 
5760 	/*
5761 	 * check if the DL_UNITDATA_REQ destination addr has valid offset
5762 	 * and length values
5763 	 */
5764 	dlup = (dl_unitdata_req_t *)mp->b_cont->b_rptr;
5765 	off = dlup->dl_dest_addr_offset;
5766 	len = dlup->dl_dest_addr_length;
5767 	if (dlup->dl_primitive != DL_UNITDATA_REQ ||
5768 	    !MBLKIN(mp->b_cont, off, len) || (len != FCIPADDRL)) {
5769 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5770 		    (CE_NOTE, "dliochdr : returns EINVAL2"));
5771 		miocnak(wq, mp, 0, EINVAL);
5772 		return;
5773 	}
5774 
5775 	dlap = (struct fcipdladdr *)(mp->b_cont->b_rptr + off);
5776 
5777 	/*
5778 	 * Allocate a new mblk to hold the ether header
5779 	 */
5780 
5781 	/*
5782 	 * setup space for network header
5783 	 */
5784 	hdrlen = (sizeof (llc_snap_hdr_t) + sizeof (fcph_network_hdr_t));
5785 	if ((nmp = allocb(hdrlen, BPRI_MED)) == NULL) {
5786 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5787 		    (CE_NOTE, "dliochdr : returns ENOMEM"));
5788 		miocnak(wq, mp, 0, ENOMEM);
5789 		return;
5790 	}
5791 	nmp->b_wptr += hdrlen;
5792 
5793 	/*
5794 	 * Fill in the Network Hdr and LLC SNAP header;
5795 	 */
5796 	headerp = (fcph_network_hdr_t *)nmp->b_rptr;
5797 	/*
5798 	 * just fill in the Node WWN here - we can fill in the NAA_ID when
5799 	 * we search the routing table
5800 	 */
5801 	if (ether_cmp(&dlap->dl_phys, &fcip_arpbroadcast_addr) == 0) {
5802 		ether_to_wwn(&fcipnhbroadcastaddr, &wwn);
5803 	} else {
5804 		ether_to_wwn(&dlap->dl_phys, &wwn);
5805 	}
5806 	bcopy(&wwn, &headerp->net_dest_addr, sizeof (la_wwn_t));
5807 	bcopy(&fport->fcipp_pwwn, &headerp->net_src_addr, sizeof (la_wwn_t));
5808 	lsnap = (llc_snap_hdr_t *)(nmp->b_rptr + sizeof (fcph_network_hdr_t));
5809 	lsnap->dsap = 0xAA;
5810 	lsnap->ssap = 0xAA;
5811 	lsnap->ctrl = 0x03;
5812 	lsnap->oui[0] = 0x00;
5813 	lsnap->oui[1] = 0x00;
5814 	lsnap->oui[2] = 0x00;
5815 	lsnap->pid = BE_16(dlap->dl_sap);
5816 
5817 	/*
5818 	 * Link new mblk in after the "request" mblks.
5819 	 */
5820 	linkb(mp, nmp);
5821 
5822 	slp->sl_flags |= FCIP_SLFAST;
5823 
5824 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5825 	    (CE_NOTE, "dliochdr : returns success "));
5826 	miocack(wq, mp, msgsize(mp->b_cont), 0);
5827 }
5828 
5829 
5830 /*
5831  * Establish a kmem cache for fcip packets
5832  */
5833 static int
5834 fcip_cache_constructor(void *buf, void *arg, int flags)
5835 {
5836 	fcip_pkt_t		*fcip_pkt = buf;
5837 	fc_packet_t		*fc_pkt;
5838 	fcip_port_info_t	*fport = (fcip_port_info_t *)arg;
5839 	int			(*cb) (caddr_t);
5840 	struct fcip		*fptr;
5841 
5842 	cb = (flags == KM_SLEEP) ? DDI_DMA_SLEEP : DDI_DMA_DONTWAIT;
5843 
5844 	ASSERT(fport != NULL);
5845 
5846 	fptr = fport->fcipp_fcip;
5847 
5848 	/*
5849 	 * we allocated space for our private area at the end of the
5850 	 * fc packet. Make sure we point to it correctly. Ideally we
5851 	 * should just push fc_packet_private to the beginning or end
5852 	 * of the fc_packet structure
5853 	 */
5854 	fcip_pkt->fcip_pkt_next = NULL;
5855 	fcip_pkt->fcip_pkt_prev = NULL;
5856 	fcip_pkt->fcip_pkt_dest = NULL;
5857 	fcip_pkt->fcip_pkt_state = 0;
5858 	fcip_pkt->fcip_pkt_reason = 0;
5859 	fcip_pkt->fcip_pkt_flags = 0;
5860 	fcip_pkt->fcip_pkt_fptr = fptr;
5861 	fcip_pkt->fcip_pkt_dma_flags = 0;
5862 
5863 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
5864 	fc_pkt->pkt_ulp_rscn_infop = NULL;
5865 
5866 	/*
5867 	 * We use pkt_cmd_dma for OUTBOUND requests. We don't expect
5868 	 * any responses for outbound IP data so no need to setup
5869 	 * response or data dma handles.
5870 	 */
5871 	if (ddi_dma_alloc_handle(fport->fcipp_dip,
5872 	    &fport->fcipp_cmd_dma_attr, cb, NULL,
5873 	    &fc_pkt->pkt_cmd_dma) != DDI_SUCCESS) {
5874 		return (FCIP_FAILURE);
5875 	}
5876 
5877 	fc_pkt->pkt_cmd_acc = fc_pkt->pkt_resp_acc = NULL;
5878 	fc_pkt->pkt_fca_private = (opaque_t)((caddr_t)buf +
5879 	    sizeof (fcip_pkt_t));
5880 	fc_pkt->pkt_ulp_private = (opaque_t)fcip_pkt;
5881 
5882 	fc_pkt->pkt_cmd_cookie_cnt = fc_pkt->pkt_resp_cookie_cnt =
5883 	    fc_pkt->pkt_data_cookie_cnt = 0;
5884 	fc_pkt->pkt_cmd_cookie = fc_pkt->pkt_resp_cookie =
5885 	    fc_pkt->pkt_data_cookie = NULL;
5886 
5887 	return (FCIP_SUCCESS);
5888 }
5889 
5890 /*
5891  * destroy the fcip kmem cache
5892  */
5893 static void
5894 fcip_cache_destructor(void *buf, void *arg)
5895 {
5896 	fcip_pkt_t		*fcip_pkt = (fcip_pkt_t *)buf;
5897 	fc_packet_t		*fc_pkt;
5898 	fcip_port_info_t	*fport = (fcip_port_info_t *)arg;
5899 	struct fcip		*fptr;
5900 
5901 	ASSERT(fport != NULL);
5902 
5903 	fptr = fport->fcipp_fcip;
5904 
5905 	ASSERT(fptr == fcip_pkt->fcip_pkt_fptr);
5906 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
5907 
5908 	if (fc_pkt->pkt_cmd_dma) {
5909 		ddi_dma_free_handle(&fc_pkt->pkt_cmd_dma);
5910 	}
5911 }
5912 
5913 /*
5914  * the fcip destination structure is hashed on Node WWN assuming
5915  * a  NAA_ID of 0x1 (IEEE)
5916  */
5917 static struct fcip_dest *
5918 fcip_get_dest(struct fcip *fptr, la_wwn_t *pwwn)
5919 {
5920 	struct fcip_dest	*fdestp = NULL;
5921 	fcip_port_info_t	*fport;
5922 	int			hash_bucket;
5923 	opaque_t		pd;
5924 	int			rval;
5925 	struct fcip_routing_table *frp;
5926 	la_wwn_t		twwn;
5927 	uint32_t		*twwnp = (uint32_t *)&twwn;
5928 
5929 	hash_bucket = FCIP_DEST_HASH(pwwn->raw_wwn);
5930 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5931 	    (CE_NOTE, "get dest hashbucket : 0x%x", hash_bucket));
5932 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5933 	    (CE_NOTE, "0x%x 0x%x 0x%x 0x%x 0x%x 0x%x",
5934 	    pwwn->raw_wwn[2], pwwn->raw_wwn[3], pwwn->raw_wwn[4],
5935 	    pwwn->raw_wwn[5], pwwn->raw_wwn[6], pwwn->raw_wwn[7]));
5936 
5937 	ASSERT(hash_bucket < FCIP_DEST_HASH_ELEMS);
5938 
5939 	if (fcip_check_port_exists(fptr)) {
5940 		/* fptr is stale, return fdestp */
5941 		return (fdestp);
5942 	}
5943 	fport = fptr->fcip_port_info;
5944 
5945 	/*
5946 	 * First check if we have active I/Os going on with the
5947 	 * destination port (an entry would exist in fcip_dest hash table)
5948 	 */
5949 	mutex_enter(&fptr->fcip_dest_mutex);
5950 	fdestp = fptr->fcip_dest[hash_bucket];
5951 	while (fdestp != NULL) {
5952 		mutex_enter(&fdestp->fcipd_mutex);
5953 		if (fdestp->fcipd_rtable) {
5954 			if (fcip_wwn_compare(pwwn, &fdestp->fcipd_pwwn,
5955 			    FCIP_COMPARE_NWWN) == 0) {
5956 				FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
5957 				    (CE_NOTE, "found fdestp"));
5958 				mutex_exit(&fdestp->fcipd_mutex);
5959 				mutex_exit(&fptr->fcip_dest_mutex);
5960 				return (fdestp);
5961 			}
5962 		}
5963 		mutex_exit(&fdestp->fcipd_mutex);
5964 		fdestp = fdestp->fcipd_next;
5965 	}
5966 	mutex_exit(&fptr->fcip_dest_mutex);
5967 
5968 	/*
5969 	 * We did not find the destination port information in our
5970 	 * active port list so search for an entry in our routing
5971 	 * table.
5972 	 */
5973 	mutex_enter(&fptr->fcip_rt_mutex);
5974 	frp = fcip_lookup_rtable(fptr, pwwn, FCIP_COMPARE_NWWN);
5975 	mutex_exit(&fptr->fcip_rt_mutex);
5976 
5977 	if (frp == NULL || (frp && (!FCIP_RTE_UNAVAIL(frp->fcipr_state)) &&
5978 	    frp->fcipr_state != PORT_DEVICE_LOGGED_IN) ||
5979 	    (frp && frp->fcipr_pd == NULL)) {
5980 		/*
5981 		 * No entry for the destination port in our routing
5982 		 * table too. First query the transport to see if it
5983 		 * already has structures for the destination port in
5984 		 * its hash tables. This must be done for all topologies
5985 		 * since we could have retired entries in the hash tables
5986 		 * which may have to be re-added without a statechange
5987 		 * callback happening. Its better to try and get an entry
5988 		 * for the destination port rather than simply failing a
5989 		 * request though it may be an overkill in private loop
5990 		 * topologies.
5991 		 * If a entry for the remote port exists in the transport's
5992 		 * hash tables, we are fine and can add the entry to our
5993 		 * routing and dest hash lists, Else for fabric configs we
5994 		 * query the nameserver if one exists or issue FARP ELS.
5995 		 */
5996 
5997 		/*
5998 		 * We need to do a PortName based Nameserver
5999 		 * query operation. So get the right PortWWN
6000 		 * for the adapter.
6001 		 */
6002 		bcopy(pwwn, &twwn, sizeof (la_wwn_t));
6003 
6004 		/*
6005 		 * Try IEEE Name (Format 1) first, this is the default and
6006 		 * Emulex uses this format.
6007 		 */
6008 		pd = fc_ulp_get_remote_port(fport->fcipp_handle,
6009 					    &twwn, &rval, 1);
6010 
6011 		if (rval != FC_SUCCESS) {
6012 			/*
6013 			 * If IEEE Name (Format 1) query failed, try IEEE
6014 			 * Extended Name (Format 2) which Qlogic uses.
6015 			 * And try port 1 on Qlogic FC-HBA first.
6016 			 * Note: On x86, we need to byte swap the 32-bit
6017 			 * word first, after the modification, swap it back.
6018 			 */
6019 			*twwnp = BE_32(*twwnp);
6020 			twwn.w.nport_id = QLC_PORT_1_ID_BITS;
6021 			twwn.w.naa_id = QLC_PORT_NAA;
6022 			*twwnp = BE_32(*twwnp);
6023 			pd = fc_ulp_get_remote_port(fport->fcipp_handle,
6024 						    &twwn, &rval, 1);
6025 		}
6026 
6027 		if (rval != FC_SUCCESS) {
6028 			/* If still failed, try port 2 on Qlogic FC-HBA. */
6029 			*twwnp = BE_32(*twwnp);
6030 			twwn.w.nport_id = QLC_PORT_2_ID_BITS;
6031 			*twwnp = BE_32(*twwnp);
6032 			pd = fc_ulp_get_remote_port(fport->fcipp_handle,
6033 						    &twwn, &rval, 1);
6034 		}
6035 
6036 		if (rval == FC_SUCCESS) {
6037 			fc_portmap_t	map;
6038 			/*
6039 			 * Add the newly found destination structure
6040 			 * to our routing table. Create a map with
6041 			 * the device we found. We could ask the
6042 			 * transport to give us the list of all
6043 			 * devices connected to our port but we
6044 			 * probably don't need to know all the devices
6045 			 * so let us just constuct a list with only
6046 			 * one device instead.
6047 			 */
6048 
6049 			fc_ulp_copy_portmap(&map, pd);
6050 			fcip_rt_update(fptr, &map, 1);
6051 
6052 			mutex_enter(&fptr->fcip_rt_mutex);
6053 			frp = fcip_lookup_rtable(fptr, pwwn,
6054 			    FCIP_COMPARE_NWWN);
6055 			mutex_exit(&fptr->fcip_rt_mutex);
6056 
6057 			fdestp = fcip_add_dest(fptr, frp);
6058 		} else if (fcip_farp_supported &&
6059 			(FC_TOP_EXTERNAL(fport->fcipp_topology) ||
6060 			(fport->fcipp_topology == FC_TOP_PT_PT))) {
6061 			/*
6062 			 * The Name server request failed so
6063 			 * issue an FARP
6064 			 */
6065 			fdestp = fcip_do_farp(fptr, pwwn, NULL,
6066 				0, 0);
6067 		} else {
6068 		    fdestp = NULL;
6069 		}
6070 	} else if (frp && frp->fcipr_state == PORT_DEVICE_LOGGED_IN) {
6071 		/*
6072 		 * Prepare a dest structure to return to caller
6073 		 */
6074 		fdestp = fcip_add_dest(fptr, frp);
6075 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
6076 		    (CE_NOTE, "in fcip get dest non fabric"));
6077 	}
6078 	return (fdestp);
6079 }
6080 
6081 
6082 /*
6083  * Endian clean WWN compare.
6084  * Returns 0 if they compare OK, else return non zero value.
6085  * flag can be bitwise OR of FCIP_COMPARE_NWWN, FCIP_COMPARE_PWWN,
6086  * FCIP_COMPARE_BROADCAST.
6087  */
6088 static int
6089 fcip_wwn_compare(la_wwn_t *wwn1, la_wwn_t *wwn2, int flag)
6090 {
6091 	int rval = 0;
6092 	if ((wwn1->raw_wwn[2] != wwn2->raw_wwn[2]) ||
6093 	    (wwn1->raw_wwn[3] != wwn2->raw_wwn[3]) ||
6094 	    (wwn1->raw_wwn[4] != wwn2->raw_wwn[4]) ||
6095 	    (wwn1->raw_wwn[5] != wwn2->raw_wwn[5]) ||
6096 	    (wwn1->raw_wwn[6] != wwn2->raw_wwn[6]) ||
6097 	    (wwn1->raw_wwn[7] != wwn2->raw_wwn[7])) {
6098 		rval = 1;
6099 	} else if ((flag == FCIP_COMPARE_PWWN) &&
6100 	    (((wwn1->raw_wwn[0] & 0xf0) != (wwn2->raw_wwn[0] & 0xf0)) ||
6101 	    (wwn1->raw_wwn[1] != wwn2->raw_wwn[1]))) {
6102 		rval = 1;
6103 	}
6104 	return (rval);
6105 }
6106 
6107 
6108 /*
6109  * Add an entry for a remote port in the dest hash table. Dest hash table
6110  * has entries for ports in the routing hash table with which we decide
6111  * to establish IP communication with. The no. of entries in the dest hash
6112  * table must always be less than or equal to the entries in the routing
6113  * hash table. Every entry in the dest hash table ofcourse must have a
6114  * corresponding entry in the routing hash table
6115  */
6116 static struct fcip_dest *
6117 fcip_add_dest(struct fcip *fptr, struct fcip_routing_table *frp)
6118 {
6119 	struct fcip_dest *fdestp = NULL;
6120 	la_wwn_t	*pwwn;
6121 	int hash_bucket;
6122 	struct fcip_dest *fdest_new;
6123 
6124 	if (frp == NULL) {
6125 		return (fdestp);
6126 	}
6127 
6128 	pwwn = &frp->fcipr_pwwn;
6129 	mutex_enter(&fptr->fcip_dest_mutex);
6130 	hash_bucket = FCIP_DEST_HASH(pwwn->raw_wwn);
6131 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
6132 	    (CE_NOTE, "add dest hash_bucket: 0x%x", hash_bucket));
6133 
6134 	ASSERT(hash_bucket < FCIP_DEST_HASH_ELEMS);
6135 
6136 	fdestp = fptr->fcip_dest[hash_bucket];
6137 	while (fdestp != NULL) {
6138 		mutex_enter(&fdestp->fcipd_mutex);
6139 		if (fdestp->fcipd_rtable) {
6140 			if (fcip_wwn_compare(pwwn, &fdestp->fcipd_pwwn,
6141 			    FCIP_COMPARE_PWWN) == 0) {
6142 				mutex_exit(&fdestp->fcipd_mutex);
6143 				mutex_exit(&fptr->fcip_dest_mutex);
6144 				return (fdestp);
6145 			}
6146 		}
6147 		mutex_exit(&fdestp->fcipd_mutex);
6148 		fdestp = fdestp->fcipd_next;
6149 	}
6150 
6151 	ASSERT(fdestp == NULL);
6152 
6153 	fdest_new = (struct fcip_dest *)
6154 			kmem_zalloc(sizeof (struct fcip_dest), KM_SLEEP);
6155 
6156 	mutex_init(&fdest_new->fcipd_mutex, NULL, MUTEX_DRIVER, NULL);
6157 	fdest_new->fcipd_next = fptr->fcip_dest[hash_bucket];
6158 	fdest_new->fcipd_refcnt = 0;
6159 	fdest_new->fcipd_rtable = frp;
6160 	fdest_new->fcipd_ncmds = 0;
6161 	fptr->fcip_dest[hash_bucket] = fdest_new;
6162 	fdest_new->fcipd_flags = FCIP_PORT_NOTLOGGED;
6163 
6164 	mutex_exit(&fptr->fcip_dest_mutex);
6165 	return (fdest_new);
6166 }
6167 
6168 /*
6169  * Cleanup the dest hash table and remove all entries
6170  */
6171 static void
6172 fcip_cleanup_dest(struct fcip *fptr)
6173 {
6174 	struct fcip_dest *fdestp = NULL;
6175 	struct fcip_dest *fdest_delp = NULL;
6176 	int i;
6177 
6178 	mutex_enter(&fptr->fcip_dest_mutex);
6179 
6180 	for (i = 0; i < FCIP_DEST_HASH_ELEMS; i++) {
6181 		fdestp = fptr->fcip_dest[i];
6182 		while (fdestp != NULL) {
6183 			mutex_destroy(&fdestp->fcipd_mutex);
6184 			fdest_delp = fdestp;
6185 			fdestp = fdestp->fcipd_next;
6186 			kmem_free(fdest_delp, sizeof (struct fcip_dest));
6187 			fptr->fcip_dest[i] = NULL;
6188 		}
6189 	}
6190 	mutex_exit(&fptr->fcip_dest_mutex);
6191 }
6192 
6193 
6194 /*
6195  * Send FARP requests for Fabric ports when we don't have the port
6196  * we wish to talk to in our routing hash table. FARP is specially required
6197  * to talk to FC switches for inband switch management. Most FC switches
6198  * today have a switch FC IP address for IP over FC inband switch management
6199  * but the WWN and Port_ID for this traffic is not available through the
6200  * Nameservers since the switch themeselves are transparent.
6201  */
6202 /* ARGSUSED */
6203 static struct fcip_dest *
6204 fcip_do_farp(struct fcip *fptr, la_wwn_t *pwwn, char *ip_addr,
6205     size_t ip_addr_len, int flags)
6206 {
6207 	fcip_pkt_t		*fcip_pkt;
6208 	fc_packet_t		*fc_pkt;
6209 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6210 	la_els_farp_t		farp_cmd;
6211 	la_els_farp_t		*fcmd;
6212 	struct fcip_dest	*fdestp = NULL;
6213 	int			rval;
6214 	clock_t			farp_lbolt;
6215 	la_wwn_t		broadcast_wwn;
6216 	struct fcip_dest	*bdestp;
6217 	struct fcip_routing_table 	*frp;
6218 
6219 	bdestp = fcip_get_dest(fptr, &broadcast_wwn);
6220 
6221 	if (bdestp == NULL) {
6222 		return (fdestp);
6223 	}
6224 
6225 	fcip_pkt = fcip_ipkt_alloc(fptr, sizeof (la_els_farp_t),
6226 	    sizeof (la_els_farp_t), bdestp->fcipd_pd, KM_SLEEP);
6227 
6228 	if (fcip_pkt == NULL) {
6229 		return (fdestp);
6230 	}
6231 
6232 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6233 	ether_to_wwn(&fcip_arpbroadcast_addr, &broadcast_wwn);
6234 
6235 	mutex_enter(&bdestp->fcipd_mutex);
6236 	if (bdestp->fcipd_rtable == NULL) {
6237 		mutex_exit(&bdestp->fcipd_mutex);
6238 		fcip_ipkt_free(fcip_pkt);
6239 		return (fdestp);
6240 	}
6241 
6242 	fcip_pkt->fcip_pkt_dest = bdestp;
6243 	fc_pkt->pkt_fca_device = bdestp->fcipd_fca_dev;
6244 
6245 	bdestp->fcipd_ncmds++;
6246 	mutex_exit(&bdestp->fcipd_mutex);
6247 
6248 	fcip_init_broadcast_pkt(fcip_pkt, NULL, 1);
6249 	fcip_pkt->fcip_pkt_flags |= FCIP_PKT_IN_LIST;
6250 
6251 	/*
6252 	 * Now initialize the FARP payload itself
6253 	 */
6254 	fcmd = &farp_cmd;
6255 	fcmd->ls_code.ls_code = LA_ELS_FARP_REQ;
6256 	fcmd->ls_code.mbz = 0;
6257 	/*
6258 	 * for now just match the Port WWN since the other match addr
6259 	 * code points are optional. We can explore matching the IP address
6260 	 * if needed
6261 	 */
6262 	if (ip_addr) {
6263 		fcmd->match_addr = FARP_MATCH_WW_PN_IPv4;
6264 	} else {
6265 		fcmd->match_addr = FARP_MATCH_WW_PN;
6266 	}
6267 
6268 	/*
6269 	 * Request the responder port to log into us - that way
6270 	 * the Transport is aware of the remote port when we create
6271 	 * an entry for it in our tables
6272 	 */
6273 	fcmd->resp_flags = FARP_INIT_REPLY | FARP_INIT_P_LOGI;
6274 	fcmd->req_id = fport->fcipp_sid;
6275 	fcmd->dest_id.port_id = fc_pkt->pkt_cmd_fhdr.d_id;
6276 	bcopy(&fport->fcipp_pwwn, &fcmd->req_pwwn, sizeof (la_wwn_t));
6277 	bcopy(&fport->fcipp_nwwn, &fcmd->req_nwwn, sizeof (la_wwn_t));
6278 	bcopy(pwwn, &fcmd->resp_pwwn, sizeof (la_wwn_t));
6279 	/*
6280 	 * copy in source IP address if we get to know it
6281 	 */
6282 	if (ip_addr) {
6283 		bcopy(ip_addr, fcmd->resp_ip, ip_addr_len);
6284 	}
6285 
6286 	fc_pkt->pkt_cmdlen = sizeof (la_els_farp_t);
6287 	fc_pkt->pkt_rsplen = sizeof (la_els_farp_t);
6288 	fc_pkt->pkt_tran_type = FC_PKT_EXCHANGE;
6289 	fc_pkt->pkt_ulp_private = (opaque_t)fcip_pkt;
6290 
6291 	/*
6292 	 * Endian safe copy
6293 	 */
6294 	FCIP_CP_OUT(fcmd, fc_pkt->pkt_cmd, fc_pkt->pkt_cmd_acc,
6295 	    sizeof (la_els_farp_t));
6296 
6297 	/*
6298 	 * send the packet in polled mode.
6299 	 */
6300 	rval = fc_ulp_issue_els(fport->fcipp_handle, fc_pkt);
6301 	if (rval != FC_SUCCESS) {
6302 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_WARN,
6303 		    "fcip_transport of farp pkt failed 0x%x", rval));
6304 		fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_LIST;
6305 		fcip_ipkt_free(fcip_pkt);
6306 
6307 		mutex_enter(&bdestp->fcipd_mutex);
6308 		bdestp->fcipd_ncmds--;
6309 		mutex_exit(&bdestp->fcipd_mutex);
6310 
6311 		return (fdestp);
6312 	}
6313 
6314 	farp_lbolt = ddi_get_lbolt();
6315 	farp_lbolt += drv_usectohz(FCIP_FARP_TIMEOUT);
6316 
6317 	mutex_enter(&fptr->fcip_mutex);
6318 	fptr->fcip_farp_rsp_flag = 0;
6319 	while (!fptr->fcip_farp_rsp_flag) {
6320 		if (cv_timedwait(&fptr->fcip_farp_cv, &fptr->fcip_mutex,
6321 		    farp_lbolt) == -1) {
6322 			/*
6323 			 * No FARP response from any destination port
6324 			 * so bail out.
6325 			 */
6326 			fptr->fcip_farp_rsp_flag = 1;
6327 		} else {
6328 			/*
6329 			 * We received a FARP response - check to see if the
6330 			 * response was in reply to our FARP request.
6331 			 */
6332 
6333 			mutex_enter(&fptr->fcip_rt_mutex);
6334 			frp = fcip_lookup_rtable(fptr, pwwn, FCIP_COMPARE_NWWN);
6335 			mutex_exit(&fptr->fcip_rt_mutex);
6336 
6337 			if ((frp != NULL) &&
6338 			    !FCIP_RTE_UNAVAIL(frp->fcipr_state)) {
6339 				fdestp = fcip_get_dest(fptr, pwwn);
6340 			} else {
6341 				/*
6342 				 * Not our FARP response so go back and wait
6343 				 * again till FARP_TIMEOUT expires
6344 				 */
6345 				fptr->fcip_farp_rsp_flag = 0;
6346 			}
6347 		}
6348 	}
6349 	mutex_exit(&fptr->fcip_mutex);
6350 
6351 	fcip_pkt->fcip_pkt_flags |= FCIP_PKT_IN_LIST;
6352 	fcip_ipkt_free(fcip_pkt);
6353 	mutex_enter(&bdestp->fcipd_mutex);
6354 	bdestp->fcipd_ncmds--;
6355 	mutex_exit(&bdestp->fcipd_mutex);
6356 	return (fdestp);
6357 }
6358 
6359 
6360 
6361 /*
6362  * Helper routine to PLOGI to a remote port we wish to talk to.
6363  * This may not be required since the port driver does logins anyway,
6364  * but this can be required in fabric cases since FARP requests/responses
6365  * don't require you to be logged in?
6366  */
6367 
6368 /* ARGSUSED */
6369 static int
6370 fcip_do_plogi(struct fcip *fptr, struct fcip_routing_table *frp)
6371 {
6372 	fcip_pkt_t		*fcip_pkt;
6373 	fc_packet_t		*fc_pkt;
6374 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6375 	la_els_logi_t		logi;
6376 	int			rval;
6377 	fc_frame_hdr_t		*fr_hdr;
6378 
6379 	/*
6380 	 * Don't bother to login for broadcast RTE entries
6381 	 */
6382 	if ((frp->fcipr_d_id.port_id == 0x0) ||
6383 	    (frp->fcipr_d_id.port_id == 0xffffff)) {
6384 		return (FC_FAILURE);
6385 	}
6386 
6387 	/*
6388 	 * We shouldn't pound in too many logins here
6389 	 *
6390 	 */
6391 	if (frp->fcipr_state == FCIP_RT_LOGIN_PROGRESS ||
6392 	    frp->fcipr_state == PORT_DEVICE_LOGGED_IN) {
6393 		return (FC_SUCCESS);
6394 	}
6395 
6396 	fcip_pkt = fcip_ipkt_alloc(fptr, sizeof (la_els_logi_t),
6397 	    sizeof (la_els_logi_t), frp->fcipr_pd, KM_SLEEP);
6398 
6399 	if (fcip_pkt == NULL) {
6400 		return (FC_FAILURE);
6401 	}
6402 
6403 	/*
6404 	 * Update back pointer for login state update
6405 	 */
6406 	fcip_pkt->fcip_pkt_frp = frp;
6407 	frp->fcipr_state = FCIP_RT_LOGIN_PROGRESS;
6408 
6409 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6410 
6411 	/*
6412 	 * Initialize frame header for ELS
6413 	 */
6414 	fr_hdr = &fc_pkt->pkt_cmd_fhdr;
6415 	fr_hdr->r_ctl = R_CTL_ELS_REQ;
6416 	fr_hdr->type = FC_TYPE_EXTENDED_LS;
6417 	fr_hdr->f_ctl = F_CTL_SEQ_INITIATIVE | F_CTL_FIRST_SEQ;
6418 	fr_hdr->df_ctl = 0;
6419 	fr_hdr->s_id = fport->fcipp_sid.port_id;
6420 	fr_hdr->d_id = frp->fcipr_d_id.port_id;
6421 	fr_hdr->seq_cnt = 0;
6422 	fr_hdr->ox_id = 0xffff;
6423 	fr_hdr->rx_id = 0xffff;
6424 	fr_hdr->ro = 0;
6425 
6426 	fc_pkt->pkt_rsplen = sizeof (la_els_logi_t);
6427 	fc_pkt->pkt_comp = fcip_ipkt_callback;
6428 	fc_pkt->pkt_tran_type = FC_PKT_EXCHANGE;
6429 	fc_pkt->pkt_timeout = 10;	/* 10 seconds */
6430 	fcip_pkt->fcip_pkt_ttl = fptr->fcip_timeout_ticks + fc_pkt->pkt_timeout;
6431 	fc_pkt->pkt_ulp_private = (opaque_t)fcip_pkt;
6432 
6433 	/*
6434 	 * Everybody does class 3, so let's just set it.  If the transport
6435 	 * knows better, it will deal with the class appropriately.
6436 	 */
6437 
6438 	fc_pkt->pkt_tran_flags = FC_TRAN_INTR | FC_TRAN_CLASS3;
6439 
6440 	/*
6441 	 * we need only fill in the ls_code and the cmd frame header
6442 	 */
6443 	bzero((void *)&logi, sizeof (la_els_logi_t));
6444 	logi.ls_code.ls_code = LA_ELS_PLOGI;
6445 	logi.ls_code.mbz = 0;
6446 
6447 	FCIP_CP_OUT((uint8_t *)&logi, fc_pkt->pkt_cmd, fc_pkt->pkt_cmd_acc,
6448 	    sizeof (la_els_logi_t));
6449 
6450 	rval = fc_ulp_login(fport->fcipp_handle, &fc_pkt, 1);
6451 	if (rval != FC_SUCCESS) {
6452 		cmn_err(CE_WARN,
6453 		    "!fc_ulp_login failed for d_id: 0x%x, rval: 0x%x",
6454 		    frp->fcipr_d_id.port_id, rval);
6455 		fcip_ipkt_free(fcip_pkt);
6456 	}
6457 	return (rval);
6458 }
6459 
6460 /*
6461  * The packet callback routine - called from the transport/FCA after
6462  * it is done DMA'ing/sending out the packet contents on the wire so
6463  * that the alloc'ed packet can be freed
6464  */
6465 static void
6466 fcip_ipkt_callback(fc_packet_t *fc_pkt)
6467 {
6468 	ls_code_t			logi_req;
6469 	ls_code_t			logi_resp;
6470 	fcip_pkt_t			*fcip_pkt;
6471 	fc_frame_hdr_t			*fr_hdr;
6472 	struct fcip 			*fptr;
6473 	fcip_port_info_t		*fport;
6474 	struct fcip_routing_table	*frp;
6475 
6476 	fr_hdr = &fc_pkt->pkt_cmd_fhdr;
6477 
6478 	FCIP_CP_IN(fc_pkt->pkt_resp, (uint8_t *)&logi_resp,
6479 	    fc_pkt->pkt_resp_acc, sizeof (logi_resp));
6480 
6481 	FCIP_CP_IN(fc_pkt->pkt_cmd, (uint8_t *)&logi_req, fc_pkt->pkt_cmd_acc,
6482 	    sizeof (logi_req));
6483 
6484 	fcip_pkt = (fcip_pkt_t *)fc_pkt->pkt_ulp_private;
6485 	frp = fcip_pkt->fcip_pkt_frp;
6486 	fptr = fcip_pkt->fcip_pkt_fptr;
6487 	fport = fptr->fcip_port_info;
6488 
6489 	ASSERT(logi_req.ls_code == LA_ELS_PLOGI);
6490 
6491 	if (fc_pkt->pkt_state != FC_PKT_SUCCESS ||
6492 	    logi_resp.ls_code != LA_ELS_ACC) {
6493 		/* EMPTY */
6494 
6495 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_WARN,
6496 		    "opcode : 0x%x to d_id: 0x%x failed",
6497 		    logi_req.ls_code, fr_hdr->d_id));
6498 
6499 		mutex_enter(&fptr->fcip_rt_mutex);
6500 		frp->fcipr_state = PORT_DEVICE_INVALID;
6501 		frp->fcipr_invalid_timeout = fptr->fcip_timeout_ticks +
6502 		    (FCIP_RTE_TIMEOUT / 2);
6503 		mutex_exit(&fptr->fcip_rt_mutex);
6504 	} else {
6505 		fc_portid_t	d_id;
6506 
6507 		d_id.port_id = fr_hdr->d_id;
6508 		d_id.priv_lilp_posit = 0;
6509 
6510 		/*
6511 		 * Update PLOGI results; FCA Handle, and Port device handles
6512 		 */
6513 		mutex_enter(&fptr->fcip_rt_mutex);
6514 		frp->fcipr_pd = fc_pkt->pkt_pd;
6515 		frp->fcipr_fca_dev =
6516 		    fc_ulp_get_fca_device(fport->fcipp_handle, d_id);
6517 		frp->fcipr_state = PORT_DEVICE_LOGGED_IN;
6518 		mutex_exit(&fptr->fcip_rt_mutex);
6519 	}
6520 
6521 	fcip_ipkt_free(fcip_pkt);
6522 }
6523 
6524 
6525 /*
6526  * pkt_alloc routine for outbound IP datagrams. The cache constructor
6527  * Only initializes the pkt_cmd_dma (which is where the outbound datagram
6528  * is stuffed) since we don't expect response
6529  */
6530 static fcip_pkt_t *
6531 fcip_pkt_alloc(struct fcip *fptr, mblk_t *bp, int flags, int datalen)
6532 {
6533 	fcip_pkt_t 	*fcip_pkt;
6534 	fc_packet_t	*fc_pkt;
6535 	ddi_dma_cookie_t	pkt_cookie;
6536 	ddi_dma_cookie_t	*cp;
6537 	uint32_t		cnt;
6538 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6539 
6540 	fcip_pkt = kmem_cache_alloc(fptr->fcip_xmit_cache, flags);
6541 	if (fcip_pkt == NULL) {
6542 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM, (CE_WARN,
6543 		    "fcip_pkt_alloc: kmem_cache_alloc failed"));
6544 		return (NULL);
6545 	}
6546 
6547 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6548 	fcip_pkt->fcip_pkt_fcpktp = fc_pkt;
6549 	fc_pkt->pkt_tran_flags = 0;
6550 	fcip_pkt->fcip_pkt_dma_flags = 0;
6551 
6552 	/*
6553 	 * the cache constructor has allocated the dma handle
6554 	 */
6555 	fc_pkt->pkt_cmd = (caddr_t)bp->b_rptr;
6556 	if (ddi_dma_addr_bind_handle(fc_pkt->pkt_cmd_dma, NULL,
6557 	    (caddr_t)bp->b_rptr, datalen, DDI_DMA_WRITE | DDI_DMA_CONSISTENT,
6558 	    DDI_DMA_DONTWAIT, NULL, &pkt_cookie,
6559 	    &fc_pkt->pkt_cmd_cookie_cnt) != DDI_DMA_MAPPED) {
6560 			goto fail;
6561 	}
6562 
6563 	fcip_pkt->fcip_pkt_dma_flags |= FCIP_CMD_DMA_BOUND;
6564 
6565 	if (fc_pkt->pkt_cmd_cookie_cnt >
6566 	    fport->fcipp_cmd_dma_attr.dma_attr_sgllen) {
6567 		goto fail;
6568 	}
6569 
6570 	ASSERT(fc_pkt->pkt_cmd_cookie_cnt != 0);
6571 
6572 	cp = fc_pkt->pkt_cmd_cookie = (ddi_dma_cookie_t *)kmem_alloc(
6573 	    fc_pkt->pkt_cmd_cookie_cnt * sizeof (pkt_cookie),
6574 	    KM_NOSLEEP);
6575 
6576 	if (cp == NULL) {
6577 		goto fail;
6578 	}
6579 
6580 	*cp = pkt_cookie;
6581 	cp++;
6582 	for (cnt = 1; cnt < fc_pkt->pkt_cmd_cookie_cnt; cnt++, cp++) {
6583 		ddi_dma_nextcookie(fc_pkt->pkt_cmd_dma, &pkt_cookie);
6584 		*cp = pkt_cookie;
6585 	}
6586 
6587 	fc_pkt->pkt_cmdlen = datalen;
6588 
6589 	fcip_pkt->fcip_pkt_mp = NULL;
6590 	fcip_pkt->fcip_pkt_wq = NULL;
6591 	fcip_pkt->fcip_pkt_dest = NULL;
6592 	fcip_pkt->fcip_pkt_next = NULL;
6593 	fcip_pkt->fcip_pkt_prev = NULL;
6594 	fcip_pkt->fcip_pkt_state = 0;
6595 	fcip_pkt->fcip_pkt_reason = 0;
6596 	fcip_pkt->fcip_pkt_flags = 0;
6597 	fcip_pkt->fcip_pkt_frp = NULL;
6598 
6599 	return (fcip_pkt);
6600 fail:
6601 	if (fcip_pkt) {
6602 		fcip_pkt_free(fcip_pkt, 0);
6603 	}
6604 	return ((fcip_pkt_t *)0);
6605 }
6606 
6607 /*
6608  * Free a packet and all its associated resources
6609  */
6610 static void
6611 fcip_pkt_free(struct fcip_pkt *fcip_pkt, int free_mblk)
6612 {
6613 	fc_packet_t	*fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6614 	struct fcip *fptr = fcip_pkt->fcip_pkt_fptr;
6615 
6616 	if (fc_pkt->pkt_cmd_cookie != NULL) {
6617 		kmem_free(fc_pkt->pkt_cmd_cookie, fc_pkt->pkt_cmd_cookie_cnt *
6618 		    sizeof (ddi_dma_cookie_t));
6619 		fc_pkt->pkt_cmd_cookie = NULL;
6620 	}
6621 
6622 	fcip_free_pkt_dma(fcip_pkt);
6623 	if (free_mblk && fcip_pkt->fcip_pkt_mp) {
6624 		freemsg(fcip_pkt->fcip_pkt_mp);
6625 		fcip_pkt->fcip_pkt_mp = NULL;
6626 	}
6627 
6628 	(void) fc_ulp_uninit_packet(fptr->fcip_port_info->fcipp_handle, fc_pkt);
6629 
6630 	kmem_cache_free(fptr->fcip_xmit_cache, (void *)fcip_pkt);
6631 }
6632 
6633 /*
6634  * Allocate a Packet for internal driver use. This is for requests
6635  * that originate from within the driver
6636  */
6637 static fcip_pkt_t *
6638 fcip_ipkt_alloc(struct fcip *fptr, int cmdlen, int resplen,
6639     opaque_t pd, int flags)
6640 {
6641 	fcip_pkt_t 		*fcip_pkt;
6642 	fc_packet_t		*fc_pkt;
6643 	int			(*cb)(caddr_t);
6644 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6645 	size_t			real_len;
6646 	uint_t			held_here = 0;
6647 	ddi_dma_cookie_t	pkt_cookie;
6648 	ddi_dma_cookie_t	*cp;
6649 	uint32_t		cnt;
6650 
6651 	cb = (flags == KM_SLEEP) ? DDI_DMA_SLEEP : DDI_DMA_DONTWAIT;
6652 
6653 	fcip_pkt = kmem_zalloc((sizeof (fcip_pkt_t) +
6654 	    fport->fcipp_fca_pkt_size), flags);
6655 
6656 	if (fcip_pkt == NULL) {
6657 		FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
6658 		    (CE_WARN, "pkt alloc of ineternal pkt failed"));
6659 		goto fail;
6660 	}
6661 
6662 	fcip_pkt->fcip_pkt_flags = FCIP_PKT_INTERNAL;
6663 	fcip_pkt->fcip_pkt_fptr = fptr;
6664 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6665 	fcip_pkt->fcip_pkt_fcpktp = fc_pkt;
6666 	fc_pkt->pkt_tran_flags = 0;
6667 	fc_pkt->pkt_cmdlen = 0;
6668 	fc_pkt->pkt_rsplen = 0;
6669 	fc_pkt->pkt_datalen = 0;
6670 	fc_pkt->pkt_fca_private = (opaque_t)((caddr_t)fcip_pkt +
6671 	    sizeof (fcip_pkt_t));
6672 	fc_pkt->pkt_ulp_private = (opaque_t)fcip_pkt;
6673 
6674 	if (cmdlen) {
6675 		if (ddi_dma_alloc_handle(fptr->fcip_dip,
6676 		    &fport->fcipp_cmd_dma_attr, cb, NULL,
6677 		    &fc_pkt->pkt_cmd_dma) != DDI_SUCCESS) {
6678 			goto fail;
6679 		}
6680 
6681 		if (ddi_dma_mem_alloc(fc_pkt->pkt_cmd_dma, cmdlen,
6682 		    &fport->fcipp_fca_acc_attr, DDI_DMA_CONSISTENT,
6683 		    cb, NULL, (caddr_t *)&fc_pkt->pkt_cmd,
6684 		    &real_len, &fc_pkt->pkt_cmd_acc) != DDI_SUCCESS) {
6685 			goto fail;
6686 		}
6687 
6688 		fcip_pkt->fcip_pkt_dma_flags |= FCIP_CMD_DMA_MEM;
6689 		fc_pkt->pkt_cmdlen = cmdlen;
6690 
6691 		if (real_len < cmdlen) {
6692 			goto fail;
6693 		}
6694 
6695 		if (ddi_dma_addr_bind_handle(fc_pkt->pkt_cmd_dma, NULL,
6696 		    (caddr_t)fc_pkt->pkt_cmd, real_len,
6697 		    DDI_DMA_WRITE | DDI_DMA_CONSISTENT, cb, NULL,
6698 		    &pkt_cookie, &fc_pkt->pkt_cmd_cookie_cnt) !=
6699 		    DDI_DMA_MAPPED) {
6700 			goto fail;
6701 		}
6702 
6703 		fcip_pkt->fcip_pkt_dma_flags |= FCIP_CMD_DMA_BOUND;
6704 
6705 		if (fc_pkt->pkt_cmd_cookie_cnt >
6706 		    fport->fcipp_cmd_dma_attr.dma_attr_sgllen) {
6707 			goto fail;
6708 		}
6709 
6710 		ASSERT(fc_pkt->pkt_cmd_cookie_cnt != 0);
6711 
6712 		cp = fc_pkt->pkt_cmd_cookie = (ddi_dma_cookie_t *)kmem_alloc(
6713 		    fc_pkt->pkt_cmd_cookie_cnt * sizeof (pkt_cookie),
6714 		    KM_NOSLEEP);
6715 
6716 		if (cp == NULL) {
6717 			goto fail;
6718 		}
6719 
6720 		*cp = pkt_cookie;
6721 		cp++;
6722 		for (cnt = 1; cnt < fc_pkt->pkt_cmd_cookie_cnt; cnt++, cp++) {
6723 			ddi_dma_nextcookie(fc_pkt->pkt_cmd_dma, &pkt_cookie);
6724 			*cp = pkt_cookie;
6725 		}
6726 	}
6727 
6728 	if (resplen) {
6729 		if (ddi_dma_alloc_handle(fptr->fcip_dip,
6730 		    &fport->fcipp_resp_dma_attr, cb, NULL,
6731 		    &fc_pkt->pkt_resp_dma) != DDI_SUCCESS) {
6732 			goto fail;
6733 		}
6734 
6735 		if (ddi_dma_mem_alloc(fc_pkt->pkt_resp_dma, resplen,
6736 		    &fport->fcipp_fca_acc_attr, DDI_DMA_CONSISTENT,
6737 		    cb, NULL, (caddr_t *)&fc_pkt->pkt_resp,
6738 		    &real_len, &fc_pkt->pkt_resp_acc) != DDI_SUCCESS) {
6739 			goto fail;
6740 		}
6741 
6742 		fcip_pkt->fcip_pkt_dma_flags |= FCIP_RESP_DMA_MEM;
6743 
6744 		if (real_len < resplen) {
6745 			goto fail;
6746 		}
6747 
6748 		if (ddi_dma_addr_bind_handle(fc_pkt->pkt_resp_dma, NULL,
6749 		    (caddr_t)fc_pkt->pkt_resp, real_len,
6750 		    DDI_DMA_WRITE | DDI_DMA_CONSISTENT, cb, NULL,
6751 		    &pkt_cookie, &fc_pkt->pkt_resp_cookie_cnt) !=
6752 		    DDI_DMA_MAPPED) {
6753 			goto fail;
6754 		}
6755 
6756 		fcip_pkt->fcip_pkt_dma_flags |= FCIP_RESP_DMA_BOUND;
6757 		fc_pkt->pkt_rsplen = resplen;
6758 
6759 		if (fc_pkt->pkt_resp_cookie_cnt >
6760 		    fport->fcipp_resp_dma_attr.dma_attr_sgllen) {
6761 			goto fail;
6762 		}
6763 
6764 		ASSERT(fc_pkt->pkt_resp_cookie_cnt != 0);
6765 
6766 		cp = fc_pkt->pkt_resp_cookie = (ddi_dma_cookie_t *)kmem_alloc(
6767 		    fc_pkt->pkt_resp_cookie_cnt * sizeof (pkt_cookie),
6768 		    KM_NOSLEEP);
6769 
6770 		if (cp == NULL) {
6771 			goto fail;
6772 		}
6773 
6774 		*cp = pkt_cookie;
6775 		cp++;
6776 		for (cnt = 1; cnt < fc_pkt->pkt_resp_cookie_cnt; cnt++, cp++) {
6777 			ddi_dma_nextcookie(fc_pkt->pkt_resp_dma, &pkt_cookie);
6778 			*cp = pkt_cookie;
6779 		}
6780 	}
6781 
6782 	/*
6783 	 * Initialize pkt_pd prior to calling fc_ulp_init_packet
6784 	 */
6785 
6786 	fc_pkt->pkt_pd = pd;
6787 
6788 	/*
6789 	 * Ask the FCA to bless the internal packet
6790 	 */
6791 	if (fc_ulp_init_packet((opaque_t)fport->fcipp_handle,
6792 	    fc_pkt, flags) != FC_SUCCESS) {
6793 		goto fail;
6794 	}
6795 
6796 	/*
6797 	 * Keep track of # of ipkts alloc-ed
6798 	 * This function can get called with mutex either held or not. So, we'll
6799 	 * grab mutex if it is not already held by this thread.
6800 	 * This has to be cleaned up someday.
6801 	 */
6802 	if (!MUTEX_HELD(&fptr->fcip_mutex)) {
6803 		held_here = 1;
6804 		mutex_enter(&fptr->fcip_mutex);
6805 	}
6806 
6807 	fptr->fcip_num_ipkts_pending++;
6808 
6809 	if (held_here)
6810 		mutex_exit(&fptr->fcip_mutex);
6811 
6812 	return (fcip_pkt);
6813 fail:
6814 	if (fcip_pkt) {
6815 		fcip_ipkt_free(fcip_pkt);
6816 	}
6817 
6818 	return (NULL);
6819 }
6820 
6821 /*
6822  * free up an internal IP packet (like a FARP pkt etc)
6823  */
6824 static void
6825 fcip_ipkt_free(fcip_pkt_t *fcip_pkt)
6826 {
6827 	fc_packet_t		*fc_pkt;
6828 	struct fcip		*fptr = fcip_pkt->fcip_pkt_fptr;
6829 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6830 
6831 	ASSERT(fptr != NULL);
6832 	ASSERT(!mutex_owned(&fptr->fcip_mutex));
6833 
6834 	/* One less ipkt to wait for */
6835 	mutex_enter(&fptr->fcip_mutex);
6836 	if (fptr->fcip_num_ipkts_pending)	/* Safety check */
6837 		fptr->fcip_num_ipkts_pending--;
6838 	mutex_exit(&fptr->fcip_mutex);
6839 
6840 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6841 
6842 	if (fc_pkt->pkt_cmd_cookie != NULL) {
6843 		kmem_free(fc_pkt->pkt_cmd_cookie, fc_pkt->pkt_cmd_cookie_cnt *
6844 		    sizeof (ddi_dma_cookie_t));
6845 		fc_pkt->pkt_cmd_cookie = NULL;
6846 	}
6847 
6848 	if (fc_pkt->pkt_resp_cookie != NULL) {
6849 		kmem_free(fc_pkt->pkt_resp_cookie, fc_pkt->pkt_resp_cookie_cnt *
6850 		    sizeof (ddi_dma_cookie_t));
6851 		fc_pkt->pkt_resp_cookie = NULL;
6852 	}
6853 
6854 	if (fc_ulp_uninit_packet(fport->fcipp_handle, fc_pkt) != FC_SUCCESS) {
6855 		FCIP_DEBUG(FCIP_DEBUG_ELS, (CE_WARN,
6856 		    "fc_ulp_uninit_pkt failed for internal fc pkt 0x%p",
6857 		    (void *)fc_pkt));
6858 	}
6859 	fcip_free_pkt_dma(fcip_pkt);
6860 	kmem_free(fcip_pkt, (sizeof (fcip_pkt_t) + fport->fcipp_fca_pkt_size));
6861 }
6862 
6863 /*
6864  * initialize a unicast request. This is a misnomer because even the
6865  * broadcast requests are initialized with this routine
6866  */
6867 static void
6868 fcip_init_unicast_pkt(fcip_pkt_t *fcip_pkt, fc_portid_t sid, fc_portid_t did,
6869     void (*comp) ())
6870 {
6871 	fc_packet_t		*fc_pkt;
6872 	fc_frame_hdr_t		*fr_hdr;
6873 	struct fcip		*fptr = fcip_pkt->fcip_pkt_fptr;
6874 
6875 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6876 	fr_hdr = &fc_pkt->pkt_cmd_fhdr;
6877 
6878 	fr_hdr->r_ctl = R_CTL_DEVICE_DATA | R_CTL_UNSOL_DATA;
6879 	fr_hdr->s_id = sid.port_id;
6880 	fr_hdr->d_id = did.port_id;
6881 	fr_hdr->type = FC_TYPE_IS8802_SNAP;
6882 	fr_hdr->f_ctl = F_CTL_FIRST_SEQ | F_CTL_LAST_SEQ;
6883 	fr_hdr->df_ctl = DF_CTL_NET_HDR;
6884 	fr_hdr->seq_cnt = 0;
6885 	fr_hdr->ox_id = 0xffff;
6886 	fr_hdr->rx_id = 0xffff;
6887 	fr_hdr->ro = 0;
6888 	/*
6889 	 * reset all the length fields
6890 	 */
6891 	fc_pkt->pkt_rsplen = 0;
6892 	fc_pkt->pkt_datalen = 0;
6893 	fc_pkt->pkt_comp = comp;
6894 	if (comp) {
6895 		fc_pkt->pkt_tran_flags |= FC_TRAN_INTR;
6896 	} else {
6897 		fc_pkt->pkt_tran_flags |= FC_TRAN_NO_INTR;
6898 	}
6899 	fc_pkt->pkt_tran_type = FC_PKT_OUTBOUND | FC_PKT_IP_WRITE;
6900 	fc_pkt->pkt_timeout = fcip_pkt_ttl_ticks;
6901 	fcip_pkt->fcip_pkt_ttl = fptr->fcip_timeout_ticks + fc_pkt->pkt_timeout;
6902 }
6903 
6904 
6905 /*
6906  * Initialize a fcip_packet for broadcast data transfers
6907  */
6908 static void
6909 fcip_init_broadcast_pkt(fcip_pkt_t *fcip_pkt, void (*comp) (), int is_els)
6910 {
6911 	fc_packet_t		*fc_pkt;
6912 	fc_frame_hdr_t		*fr_hdr;
6913 	struct fcip		*fptr = fcip_pkt->fcip_pkt_fptr;
6914 	fcip_port_info_t	*fport = fptr->fcip_port_info;
6915 	uint32_t		sid;
6916 	uint32_t		did;
6917 
6918 	FCIP_TNF_PROBE_1((fcip_init_broadcast_pkt, "fcip io", /* CSTYLED */,
6919 		tnf_string, msg, "enter"));
6920 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6921 	fr_hdr = &fc_pkt->pkt_cmd_fhdr;
6922 	sid = fport->fcipp_sid.port_id;
6923 
6924 	if (is_els) {
6925 		fr_hdr->r_ctl = R_CTL_ELS_REQ;
6926 	} else {
6927 		fr_hdr->r_ctl = R_CTL_DEVICE_DATA | R_CTL_UNSOL_DATA;
6928 	}
6929 	fr_hdr->s_id = sid;
6930 	/*
6931 	 * The destination broadcast address depends on the topology
6932 	 * of the underlying port
6933 	 */
6934 	did = fptr->fcip_broadcast_did;
6935 	/*
6936 	 * mark pkt a broadcast pkt
6937 	 */
6938 	fc_pkt->pkt_tran_type = FC_PKT_BROADCAST;
6939 
6940 	fr_hdr->d_id = did;
6941 	fr_hdr->type = FC_TYPE_IS8802_SNAP;
6942 	fr_hdr->f_ctl = F_CTL_FIRST_SEQ | F_CTL_LAST_SEQ | F_CTL_END_SEQ;
6943 	fr_hdr->f_ctl &= ~(F_CTL_SEQ_INITIATIVE);
6944 	fr_hdr->df_ctl = DF_CTL_NET_HDR;
6945 	fr_hdr->seq_cnt = 0;
6946 	fr_hdr->ox_id = 0xffff;
6947 	fr_hdr->rx_id = 0xffff;
6948 	fr_hdr->ro = 0;
6949 	fc_pkt->pkt_comp = comp;
6950 
6951 	if (comp) {
6952 		fc_pkt->pkt_tran_flags |= FC_TRAN_INTR;
6953 	} else {
6954 		fc_pkt->pkt_tran_flags |= FC_TRAN_NO_INTR;
6955 	}
6956 
6957 	fc_pkt->pkt_tran_type = FC_PKT_BROADCAST;
6958 	fc_pkt->pkt_timeout = fcip_pkt_ttl_ticks;
6959 	fcip_pkt->fcip_pkt_ttl = fptr->fcip_timeout_ticks + fc_pkt->pkt_timeout;
6960 }
6961 
6962 
6963 
6964 /*
6965  * Free up all DMA resources associated with an allocated packet
6966  */
6967 static void
6968 fcip_free_pkt_dma(fcip_pkt_t *fcip_pkt)
6969 {
6970 	fc_packet_t	*fc_pkt;
6971 
6972 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
6973 
6974 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
6975 	    (CE_NOTE, "in freepktdma : flags 0x%x",
6976 	    fcip_pkt->fcip_pkt_dma_flags));
6977 
6978 	if (fcip_pkt->fcip_pkt_dma_flags & FCIP_CMD_DMA_BOUND) {
6979 		(void) ddi_dma_unbind_handle(fc_pkt->pkt_cmd_dma);
6980 	}
6981 	if (fcip_pkt->fcip_pkt_dma_flags & FCIP_CMD_DMA_MEM) {
6982 		ddi_dma_mem_free(&fc_pkt->pkt_cmd_acc);
6983 	}
6984 
6985 	if (fcip_pkt->fcip_pkt_dma_flags & FCIP_RESP_DMA_BOUND) {
6986 		(void) ddi_dma_unbind_handle(fc_pkt->pkt_resp_dma);
6987 	}
6988 	if (fcip_pkt->fcip_pkt_dma_flags & FCIP_RESP_DMA_MEM) {
6989 		ddi_dma_mem_free(&fc_pkt->pkt_resp_acc);
6990 	}
6991 	/*
6992 	 * for internal commands, we need to free up the dma handles too.
6993 	 * This is done in the cache destructor for non internal cmds
6994 	 */
6995 	if (fcip_pkt->fcip_pkt_flags & FCIP_PKT_INTERNAL) {
6996 		if (fc_pkt->pkt_cmd_dma) {
6997 			ddi_dma_free_handle(&fc_pkt->pkt_cmd_dma);
6998 		}
6999 		if (fc_pkt->pkt_resp_dma) {
7000 			ddi_dma_free_handle(&fc_pkt->pkt_resp_dma);
7001 		}
7002 	}
7003 }
7004 
7005 
7006 /*
7007  * helper routine to generate a string, given an ether addr
7008  */
7009 static void
7010 fcip_ether_to_str(struct ether_addr *e, caddr_t s)
7011 {
7012 	int i;
7013 
7014 	for (i = 0; i < sizeof (struct ether_addr); i++, s += 2) {
7015 		FCIP_DEBUG(FCIP_DEBUG_MISC,
7016 		    (CE_CONT, "0x%02X:", e->ether_addr_octet[i]));
7017 		(void) sprintf(s, "%02X", e->ether_addr_octet[i]);
7018 	}
7019 
7020 	*s = '\0';
7021 }
7022 
7023 /*
7024  * When a broadcast request comes from the upper streams modules, it
7025  * is ugly to look into every datagram to figure out if it is a broadcast
7026  * datagram or a unicast packet. Instead just add the broadcast entries
7027  * into our routing and dest tables and the standard hash table look ups
7028  * will find the entries. It is a lot cleaner this way. Also Solaris ifconfig
7029  * seems to be very ethernet specific and it requires broadcasts to the
7030  * ether broadcast addr of 0xffffffffff to succeed even though we specified
7031  * in the dl_info request that our broadcast MAC addr is 0x0000000000
7032  * (can't figure out why RFC2625 did this though). So add broadcast entries
7033  * for both MAC address
7034  */
7035 static int
7036 fcip_dest_add_broadcast_entry(struct fcip *fptr, int new_flag)
7037 {
7038 	fc_portmap_t 		map;
7039 	struct fcip_routing_table *frp;
7040 	uint32_t		did;
7041 	la_wwn_t		broadcast_wwn;
7042 
7043 	/*
7044 	 * get port_id of destination for broadcast - this is topology
7045 	 * dependent
7046 	 */
7047 	did = fptr->fcip_broadcast_did;
7048 
7049 	ether_to_wwn(&fcip_arpbroadcast_addr, &broadcast_wwn);
7050 	bcopy((void *)&broadcast_wwn, (void *)&map.map_pwwn, sizeof (la_wwn_t));
7051 	bcopy((void *)&broadcast_wwn, (void *)&map.map_nwwn, sizeof (la_wwn_t));
7052 
7053 	map.map_did.port_id = did;
7054 	map.map_hard_addr.hard_addr = did;
7055 	map.map_state = PORT_DEVICE_VALID;
7056 	if (new_flag) {
7057 		map.map_type = PORT_DEVICE_NEW;
7058 	} else {
7059 		map.map_type = PORT_DEVICE_CHANGED;
7060 	}
7061 	map.map_flags = 0;
7062 	map.map_pd = NULL;
7063 	bzero(&map.map_fc4_types, sizeof (map.map_fc4_types));
7064 	fcip_rt_update(fptr, &map, 1);
7065 	mutex_enter(&fptr->fcip_rt_mutex);
7066 	frp = fcip_lookup_rtable(fptr, &broadcast_wwn, FCIP_COMPARE_NWWN);
7067 	mutex_exit(&fptr->fcip_rt_mutex);
7068 	if (frp == NULL) {
7069 		return (FC_FAILURE);
7070 	}
7071 	(void) fcip_add_dest(fptr, frp);
7072 	/*
7073 	 * The Upper IP layers expect the traditional broadcast MAC addr
7074 	 * of 0xff ff ff ff ff ff to work too if we want to plumb the fcip
7075 	 * stream through the /etc/hostname.fcipXX file. Instead of checking
7076 	 * each phys addr for a match with fcip's ARP header broadcast
7077 	 * addr (0x00 00 00 00 00 00), its simply easier to add another
7078 	 * broadcast entry for 0xff ff ff ff ff ff.
7079 	 */
7080 	ether_to_wwn(&fcipnhbroadcastaddr, &broadcast_wwn);
7081 	bcopy((void *)&broadcast_wwn, (void *)&map.map_pwwn, sizeof (la_wwn_t));
7082 	bcopy((void *)&broadcast_wwn, (void *)&map.map_nwwn, sizeof (la_wwn_t));
7083 	fcip_rt_update(fptr, &map, 1);
7084 	mutex_enter(&fptr->fcip_rt_mutex);
7085 	frp = fcip_lookup_rtable(fptr, &broadcast_wwn, FCIP_COMPARE_NWWN);
7086 	mutex_exit(&fptr->fcip_rt_mutex);
7087 	if (frp == NULL) {
7088 		return (FC_FAILURE);
7089 	}
7090 	(void) fcip_add_dest(fptr, frp);
7091 	return (FC_SUCCESS);
7092 }
7093 
7094 /*
7095  * We need to obtain the D_ID of the broadcast port for transmitting all
7096  * our broadcast (and multicast) requests. The broadcast D_ID as we know
7097  * is dependent on the link topology
7098  */
7099 static uint32_t
7100 fcip_get_broadcast_did(struct fcip *fptr)
7101 {
7102 	fcip_port_info_t	*fport = fptr->fcip_port_info;
7103 	uint32_t		did = 0;
7104 	uint32_t		sid;
7105 
7106 	FCIP_TNF_PROBE_2((fcip_get_broadcast_did, "fcip io", /* CSTYLED */,
7107 		tnf_string, msg, "enter",
7108 		tnf_opaque, fptr, fptr));
7109 
7110 	sid = fport->fcipp_sid.port_id;
7111 
7112 	switch (fport->fcipp_topology) {
7113 
7114 	case FC_TOP_PT_PT: {
7115 		fc_portmap_t	*port_map = NULL;
7116 		uint32_t	listlen = 0;
7117 
7118 		if (fc_ulp_getportmap(fport->fcipp_handle, &port_map,
7119 		    &listlen, FC_ULP_PLOGI_DONTCARE) == FC_SUCCESS) {
7120 			FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_NOTE,
7121 			    "fcip_gpmap: listlen :  0x%x", listlen));
7122 			if (listlen == 1) {
7123 				did = port_map->map_did.port_id;
7124 			}
7125 		}
7126 		if (port_map) {
7127 			kmem_free(port_map, listlen * sizeof (fc_portmap_t));
7128 		}
7129 		if (listlen != 1) {
7130 			/* Dummy return value */
7131 			return (0x00FFFFFF);
7132 		}
7133 		break;
7134 	}
7135 
7136 	case FC_TOP_NO_NS:
7137 	/* FALLTHROUGH */
7138 	case FC_TOP_FABRIC:
7139 		/*
7140 		 * The broadcast address is the same whether or not
7141 		 * the switch/fabric contains a Name service.
7142 		 */
7143 		did = 0x00FFFFFF;
7144 		break;
7145 
7146 	case FC_TOP_PUBLIC_LOOP:
7147 		/*
7148 		 * The open replicate primitive must not be used. The
7149 		 * broadcast sequence is simply sent to ALPA 0x00. The
7150 		 * fabric controller then propagates the broadcast to all
7151 		 * other ports. The fabric propagates the broadcast by
7152 		 * using the OPNfr primitive.
7153 		 */
7154 		did = 0x00;
7155 		break;
7156 
7157 	case FC_TOP_PRIVATE_LOOP:
7158 		/*
7159 		 * The source port for broadcast in private loop mode
7160 		 * must send an OPN(fr) signal forcing all ports in the
7161 		 * loop to replicate the frames that they receive.
7162 		 */
7163 		did = 0x00FFFFFF;
7164 		break;
7165 
7166 	case FC_TOP_UNKNOWN:
7167 	/* FALLTHROUGH */
7168 	default:
7169 		did = sid;
7170 		FCIP_DEBUG(FCIP_DEBUG_INIT, (CE_WARN,
7171 		    "fcip(0x%x):unknown topology in init_broadcast_pkt",
7172 		    fptr->fcip_instance));
7173 		break;
7174 	}
7175 	FCIP_TNF_PROBE_2((fcip_get_broadcast_did, "fcip io", /* CSTYLED */,
7176 		tnf_string, msg, "return",
7177 		tnf_opaque, did, did));
7178 
7179 	return (did);
7180 }
7181 
7182 
7183 /*
7184  * fcip timeout performs 2 operations:
7185  * 1. timeout any packets sent to the FCA for which a callback hasn't
7186  *    happened. If you are wondering why we need a callback since all
7187  *    traffic in FCIP is unidirectional, hence all exchanges are unidirectional
7188  *    but wait, we can only free up the resources after we know the FCA has
7189  *    DMA'ed out the data. pretty obvious eh :)
7190  *
7191  * 2. Retire and routing table entries we marked up for retiring. This is
7192  *    to give the link a chance to recover instead of marking a port down
7193  *    when we have lost all communication with it after a link transition
7194  */
7195 static void
7196 fcip_timeout(void *arg)
7197 {
7198 	struct fcip 			*fptr = (struct fcip *)arg;
7199 	int				i;
7200 	fcip_pkt_t			*fcip_pkt;
7201 	struct fcip_dest		*fdestp;
7202 	int 				index;
7203 	struct fcip_routing_table 	*frtp;
7204 	int				dispatch_rte_removal = 0;
7205 
7206 	mutex_enter(&fptr->fcip_mutex);
7207 
7208 	fptr->fcip_flags |= FCIP_IN_TIMEOUT;
7209 	fptr->fcip_timeout_ticks += fcip_tick_incr;
7210 
7211 	if (fptr->fcip_flags & (FCIP_DETACHED | FCIP_DETACHING | \
7212 	    FCIP_SUSPENDED | FCIP_POWER_DOWN)) {
7213 		fptr->fcip_flags &= ~(FCIP_IN_TIMEOUT);
7214 		mutex_exit(&fptr->fcip_mutex);
7215 		return;
7216 	}
7217 
7218 	if (fptr->fcip_port_state == FCIP_PORT_OFFLINE) {
7219 		if (fptr->fcip_timeout_ticks > fptr->fcip_mark_offline) {
7220 			fptr->fcip_flags |= FCIP_LINK_DOWN;
7221 		}
7222 	}
7223 	if (!fptr->fcip_flags & FCIP_RTE_REMOVING) {
7224 		dispatch_rte_removal = 1;
7225 	}
7226 	mutex_exit(&fptr->fcip_mutex);
7227 
7228 	/*
7229 	 * Check if we have any Invalid routing table entries in our
7230 	 * hashtable we have marked off for deferred removal. If any,
7231 	 * we can spawn a taskq thread to do the cleanup for us. We
7232 	 * need to avoid cleanup in the timeout thread since we may
7233 	 * have to wait for outstanding commands to complete before
7234 	 * we retire a routing table entry. Also dispatch the taskq
7235 	 * thread only if we are already do not have a taskq thread
7236 	 * dispatched.
7237 	 */
7238 	if (dispatch_rte_removal) {
7239 		mutex_enter(&fptr->fcip_rt_mutex);
7240 		for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
7241 			frtp = fptr->fcip_rtable[index];
7242 			while (frtp) {
7243 				if ((frtp->fcipr_state == FCIP_RT_INVALID) &&
7244 				    (fptr->fcip_timeout_ticks >
7245 				    frtp->fcipr_invalid_timeout)) {
7246 					/*
7247 					 * If we cannot schedule a task thread
7248 					 * let us attempt again on the next
7249 					 * tick rather than call
7250 					 * fcip_rte_remove_deferred() from here
7251 					 * directly since the routine can sleep.
7252 					 */
7253 					frtp->fcipr_state = FCIP_RT_RETIRED;
7254 
7255 					mutex_enter(&fptr->fcip_mutex);
7256 					fptr->fcip_flags |= FCIP_RTE_REMOVING;
7257 					mutex_exit(&fptr->fcip_mutex);
7258 
7259 					if (taskq_dispatch(fptr->fcip_tq,
7260 					    fcip_rte_remove_deferred, fptr,
7261 					    KM_NOSLEEP) == 0) {
7262 						/*
7263 						 * failed - so mark the entry
7264 						 * as invalid again.
7265 						 */
7266 						frtp->fcipr_state =
7267 						    FCIP_RT_INVALID;
7268 
7269 						mutex_enter(&fptr->fcip_mutex);
7270 						fptr->fcip_flags &=
7271 						    ~FCIP_RTE_REMOVING;
7272 						mutex_exit(&fptr->fcip_mutex);
7273 					}
7274 				}
7275 				frtp = frtp->fcipr_next;
7276 			}
7277 		}
7278 		mutex_exit(&fptr->fcip_rt_mutex);
7279 	}
7280 
7281 	mutex_enter(&fptr->fcip_dest_mutex);
7282 
7283 	/*
7284 	 * Now timeout any packets stuck with the transport/FCA for too long
7285 	 */
7286 	for (i = 0; i < FCIP_DEST_HASH_ELEMS; i++) {
7287 		fdestp = fptr->fcip_dest[i];
7288 		while (fdestp != NULL) {
7289 			mutex_enter(&fdestp->fcipd_mutex);
7290 			for (fcip_pkt = fdestp->fcipd_head; fcip_pkt != NULL;
7291 			    fcip_pkt = fcip_pkt->fcip_pkt_next) {
7292 				if (fcip_pkt->fcip_pkt_flags &
7293 				    (FCIP_PKT_RETURNED | FCIP_PKT_IN_TIMEOUT |
7294 				    FCIP_PKT_IN_ABORT)) {
7295 					continue;
7296 				}
7297 				if (fptr->fcip_timeout_ticks >
7298 				    fcip_pkt->fcip_pkt_ttl) {
7299 					fcip_pkt->fcip_pkt_flags |=
7300 					    FCIP_PKT_IN_TIMEOUT;
7301 
7302 					mutex_exit(&fdestp->fcipd_mutex);
7303 					if (taskq_dispatch(fptr->fcip_tq,
7304 					    fcip_pkt_timeout, fcip_pkt,
7305 					    KM_NOSLEEP) == 0) {
7306 						/*
7307 						 * timeout immediately
7308 						 */
7309 						fcip_pkt_timeout(fcip_pkt);
7310 					}
7311 					mutex_enter(&fdestp->fcipd_mutex);
7312 					/*
7313 					 * The linked list is altered because
7314 					 * of one of the following reasons:
7315 					 *	a. Timeout code dequeued a pkt
7316 					 *	b. Pkt completion happened
7317 					 *
7318 					 * So restart the spin starting at
7319 					 * the head again; This is a bit
7320 					 * excessive, but okay since
7321 					 * fcip_timeout_ticks isn't incremented
7322 					 * for this spin, we will skip the
7323 					 * not-to-be-timedout packets quickly
7324 					 */
7325 					fcip_pkt = fdestp->fcipd_head;
7326 					if (fcip_pkt == NULL) {
7327 						break;
7328 					}
7329 				}
7330 			}
7331 			mutex_exit(&fdestp->fcipd_mutex);
7332 			fdestp = fdestp->fcipd_next;
7333 		}
7334 	}
7335 	mutex_exit(&fptr->fcip_dest_mutex);
7336 
7337 	/*
7338 	 * reschedule the timeout thread
7339 	 */
7340 	mutex_enter(&fptr->fcip_mutex);
7341 
7342 	fptr->fcip_timeout_id = timeout(fcip_timeout, fptr,
7343 	    drv_usectohz(1000000));
7344 	fptr->fcip_flags &= ~(FCIP_IN_TIMEOUT);
7345 	mutex_exit(&fptr->fcip_mutex);
7346 }
7347 
7348 
7349 /*
7350  * This routine is either called from taskq or directly from fcip_timeout
7351  * does the actual job of aborting the packet
7352  */
7353 static void
7354 fcip_pkt_timeout(void *arg)
7355 {
7356 	fcip_pkt_t		*fcip_pkt = (fcip_pkt_t *)arg;
7357 	struct fcip_dest	*fdestp;
7358 	struct fcip		*fptr;
7359 	fc_packet_t		*fc_pkt;
7360 	fcip_port_info_t	*fport;
7361 	int			rval;
7362 
7363 	fdestp = fcip_pkt->fcip_pkt_dest;
7364 	fptr = fcip_pkt->fcip_pkt_fptr;
7365 	fport = fptr->fcip_port_info;
7366 	fc_pkt = FCIP_PKT_TO_FC_PKT(fcip_pkt);
7367 
7368 	/*
7369 	 * try to abort the pkt
7370 	 */
7371 	fcip_pkt->fcip_pkt_flags |= FCIP_PKT_IN_ABORT;
7372 	rval = fc_ulp_abort(fport->fcipp_handle, fc_pkt, KM_NOSLEEP);
7373 
7374 	FCIP_DEBUG(FCIP_DEBUG_DOWNSTREAM,
7375 	    (CE_NOTE, "fc_ulp_abort returns: 0x%x", rval));
7376 
7377 	if (rval == FC_SUCCESS) {
7378 		ASSERT(fdestp != NULL);
7379 
7380 		/*
7381 		 * dequeue the pkt from the dest structure pkt list
7382 		 */
7383 		fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_ABORT;
7384 		mutex_enter(&fdestp->fcipd_mutex);
7385 		rval = fcip_fdestp_dequeue_pkt(fdestp, fcip_pkt);
7386 		ASSERT(rval == 1);
7387 		mutex_exit(&fdestp->fcipd_mutex);
7388 
7389 		/*
7390 		 * Now cleanup the pkt and free the mblk
7391 		 */
7392 		fcip_pkt_free(fcip_pkt, 1);
7393 	} else {
7394 		/*
7395 		 * abort failed - just mark the pkt as done and
7396 		 * wait for it to complete in fcip_pkt_callback since
7397 		 * the pkt has already been xmitted by the FCA
7398 		 */
7399 		fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_TIMEOUT;
7400 		if (fcip_pkt->fcip_pkt_flags & FCIP_PKT_RETURNED) {
7401 			fcip_pkt->fcip_pkt_flags &= ~FCIP_PKT_IN_ABORT;
7402 			mutex_enter(&fdestp->fcipd_mutex);
7403 			rval = fcip_fdestp_dequeue_pkt(fdestp, fcip_pkt);
7404 			ASSERT(rval == 1);
7405 			mutex_exit(&fdestp->fcipd_mutex);
7406 
7407 			fcip_pkt_free(fcip_pkt, 1);
7408 		}
7409 		return;
7410 	}
7411 }
7412 
7413 
7414 /*
7415  * Remove  a routing table entry marked for deferred removal. This routine
7416  * unlike fcip_pkt_timeout, is always called from a taskq context
7417  */
7418 static void
7419 fcip_rte_remove_deferred(void *arg)
7420 {
7421 	struct fcip 			*fptr = (struct fcip *)arg;
7422 	int				hash_bucket;
7423 	struct fcip_dest 		*fdestp;
7424 	la_wwn_t			*pwwn;
7425 	int 				index;
7426 	struct fcip_routing_table 	*frtp, *frtp_next, *frtp_prev;
7427 
7428 
7429 	mutex_enter(&fptr->fcip_rt_mutex);
7430 	for (index = 0; index < FCIP_RT_HASH_ELEMS; index++) {
7431 		frtp = fptr->fcip_rtable[index];
7432 		frtp_prev = NULL;
7433 		while (frtp) {
7434 			frtp_next = frtp->fcipr_next;
7435 
7436 			if (frtp->fcipr_state == FCIP_RT_RETIRED) {
7437 
7438 				pwwn = &frtp->fcipr_pwwn;
7439 				/*
7440 				 * Get hold of destination pointer
7441 				 */
7442 				mutex_enter(&fptr->fcip_dest_mutex);
7443 
7444 				hash_bucket = FCIP_DEST_HASH(pwwn->raw_wwn);
7445 				ASSERT(hash_bucket < FCIP_DEST_HASH_ELEMS);
7446 
7447 				fdestp = fptr->fcip_dest[hash_bucket];
7448 				while (fdestp != NULL) {
7449 					mutex_enter(&fdestp->fcipd_mutex);
7450 					if (fdestp->fcipd_rtable) {
7451 						if (fcip_wwn_compare(pwwn,
7452 						    &fdestp->fcipd_pwwn,
7453 						    FCIP_COMPARE_PWWN) == 0) {
7454 							mutex_exit(
7455 							&fdestp->fcipd_mutex);
7456 							break;
7457 						}
7458 					}
7459 					mutex_exit(&fdestp->fcipd_mutex);
7460 					fdestp = fdestp->fcipd_next;
7461 				}
7462 
7463 				mutex_exit(&fptr->fcip_dest_mutex);
7464 				if (fdestp == NULL) {
7465 					frtp_prev = frtp;
7466 					frtp = frtp_next;
7467 					continue;
7468 				}
7469 
7470 				mutex_enter(&fdestp->fcipd_mutex);
7471 				if (fdestp->fcipd_ncmds) {
7472 					/*
7473 					 * Instead of waiting to drain commands
7474 					 * let us revisit this RT entry in
7475 					 * the next pass.
7476 					 */
7477 					mutex_exit(&fdestp->fcipd_mutex);
7478 					frtp_prev = frtp;
7479 					frtp = frtp_next;
7480 					continue;
7481 				}
7482 
7483 				/*
7484 				 * We are clean, so remove the RTE
7485 				 */
7486 				fdestp->fcipd_rtable = NULL;
7487 				mutex_exit(&fdestp->fcipd_mutex);
7488 
7489 				FCIP_TNF_PROBE_2((fcip_rte_remove_deferred,
7490 					"fcip io", /* CSTYLED */,
7491 					tnf_string, msg,
7492 					"remove retired routing entry",
7493 					tnf_int, index, index));
7494 
7495 				if (frtp_prev == NULL) {
7496 					/* first element */
7497 					fptr->fcip_rtable[index] =
7498 					    frtp->fcipr_next;
7499 				} else {
7500 					frtp_prev->fcipr_next =
7501 					    frtp->fcipr_next;
7502 				}
7503 				kmem_free(frtp,
7504 				    sizeof (struct fcip_routing_table));
7505 
7506 				frtp = frtp_next;
7507 			} else {
7508 				frtp_prev = frtp;
7509 				frtp = frtp_next;
7510 			}
7511 		}
7512 	}
7513 	mutex_exit(&fptr->fcip_rt_mutex);
7514 	/*
7515 	 * Clear the RTE_REMOVING flag
7516 	 */
7517 	mutex_enter(&fptr->fcip_mutex);
7518 	fptr->fcip_flags &= ~FCIP_RTE_REMOVING;
7519 	mutex_exit(&fptr->fcip_mutex);
7520 }
7521 
7522 /*
7523  * Walk through all the dest hash table entries and count up the total
7524  * no. of packets outstanding against a given port
7525  */
7526 static int
7527 fcip_port_get_num_pkts(struct fcip *fptr)
7528 {
7529 	int 			num_cmds = 0;
7530 	int 			i;
7531 	struct fcip_dest	*fdestp;
7532 
7533 	ASSERT(mutex_owned(&fptr->fcip_dest_mutex));
7534 
7535 	for (i = 0; i < FCIP_DEST_HASH_ELEMS; i++) {
7536 		fdestp = fptr->fcip_dest[i];
7537 		while (fdestp != NULL) {
7538 			mutex_enter(&fdestp->fcipd_mutex);
7539 
7540 			ASSERT(fdestp->fcipd_ncmds >= 0);
7541 
7542 			if (fdestp->fcipd_ncmds > 0) {
7543 				num_cmds += fdestp->fcipd_ncmds;
7544 			}
7545 			mutex_exit(&fdestp->fcipd_mutex);
7546 			fdestp = fdestp->fcipd_next;
7547 		}
7548 	}
7549 
7550 	return (num_cmds);
7551 }
7552 
7553 
7554 /*
7555  * Walk through the routing table for this state instance and see if there is a
7556  * PLOGI in progress for any of the entries. Return success even if we find one.
7557  */
7558 static int
7559 fcip_plogi_in_progress(struct fcip *fptr)
7560 {
7561 	int				i;
7562 	struct fcip_routing_table	*frp;
7563 
7564 	ASSERT(mutex_owned(&fptr->fcip_rt_mutex));
7565 
7566 	for (i = 0; i < FCIP_RT_HASH_ELEMS; i++) {
7567 		frp = fptr->fcip_rtable[i];
7568 		while (frp) {
7569 			if (frp->fcipr_state == FCIP_RT_LOGIN_PROGRESS) {
7570 				/* Found an entry where PLOGI is in progress */
7571 				return (1);
7572 			}
7573 			frp = frp->fcipr_next;
7574 		}
7575 	}
7576 
7577 	return (0);
7578 }
7579 
7580 /*
7581  * Walk through the fcip port global list and check if the given port exists in
7582  * the list. Returns "0" if port exists and "1" if otherwise.
7583  */
7584 static int
7585 fcip_check_port_exists(struct fcip *fptr)
7586 {
7587 	fcip_port_info_t	*cur_fport;
7588 	fcip_port_info_t	*fport;
7589 
7590 	mutex_enter(&fcip_global_mutex);
7591 	fport = fptr->fcip_port_info;
7592 	cur_fport = fcip_port_head;
7593 	while (cur_fport != NULL) {
7594 		if (cur_fport == fport) {
7595 			/* Found */
7596 			mutex_exit(&fcip_global_mutex);
7597 			return (0);
7598 		} else {
7599 			cur_fport = cur_fport->fcipp_next;
7600 		}
7601 	}
7602 	mutex_exit(&fcip_global_mutex);
7603 
7604 	return (1);
7605 }
7606 
7607 /*
7608  * Constructor to initialize the sendup elements for callback into
7609  * modules upstream
7610  */
7611 
7612 /* ARGSUSED */
7613 static int
7614 fcip_sendup_constructor(void *buf, void *arg, int flags)
7615 {
7616 	struct fcip_sendup_elem	*msg_elem = (struct fcip_sendup_elem *)buf;
7617 	fcip_port_info_t	*fport = (fcip_port_info_t *)arg;
7618 
7619 	ASSERT(fport != NULL);
7620 
7621 	msg_elem->fcipsu_mp = NULL;
7622 	msg_elem->fcipsu_func = NULL;
7623 	msg_elem->fcipsu_next = NULL;
7624 
7625 	return (FCIP_SUCCESS);
7626 }
7627