xref: /illumos-gate/usr/src/uts/common/io/hook.c (revision 1bff1300cebf1ea8e11ce928b10e208097e67f24)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2008 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  *
25  * Copyright 2018 Joyent, Inc.  All rights reserved.
26  * Copyright (c) 2016 by Delphix. All rights reserved.
27  */
28 #include <sys/param.h>
29 #include <sys/types.h>
30 #include <sys/systm.h>
31 #include <sys/errno.h>
32 #include <sys/kmem.h>
33 #include <sys/mutex.h>
34 #include <sys/condvar.h>
35 #include <sys/modctl.h>
36 #include <sys/hook_impl.h>
37 #include <sys/sdt.h>
38 #include <sys/cmn_err.h>
39 
40 /*
41  * This file provides kernel hook framework.
42  */
43 
44 static struct modldrv modlmisc = {
45 	&mod_miscops,				/* drv_modops */
46 	"Hooks Interface v1.0",			/* drv_linkinfo */
47 };
48 
49 static struct modlinkage modlinkage = {
50 	MODREV_1,				/* ml_rev */
51 	&modlmisc,				/* ml_linkage */
52 	NULL
53 };
54 
55 static const char *hook_hintvalue_none = "<none>";
56 
57 /*
58  * How it works.
59  * =============
60  * Use of the hook framework here is tied up with zones - when a new zone
61  * is created, we create a new hook_stack_t and are open to business for
62  * allowing new hook families and their events.
63  *
64  * A consumer of these hooks is expected to operate in this fashion:
65  * 1) call hook_family_add() to create a new family of hooks. It is a
66  *    current requirement that this call must be made with the value
67  *    returned from hook_stack_init, by way of infrastructure elsewhere.
68  * 2) add events to the registered family with calls to hook_event_add.
69  *
70  * At this point, the structures in place should be open to others to
71  * add hooks to the event or add notifiers for when the contents of the
72  * hook stack changes.
73  *
74  * The interesting stuff happens on teardown.
75  *
76  * It is a requirement that the provider of hook events work in the reverse
77  * order to the above, so that the first step is:
78  * 1) remove events from each hook family created earlier
79  * 2) remove hook families from the hook stack.
80  *
81  * When doing teardown of both events and families, a check is made to see
82  * if either structure is still "busy". If so then a boolean flag (FWF_DESTROY)
83  * is set to say that the structure is condemned. The presence of this flag
84  * being set must be checked for in _add()/_register()/ functions and a
85  * failure returned if it is set. It is ignored by the _find() functions
86  * because they're used by _remove()/_unregister().
87  * While setting the condemned flag when trying to delete a structure would
88  * normally be keyed from the presence of a reference count being greater
89  * than 1, in this implementation there are no reference counts required:
90  * instead the presence of objects on linked lists is taken to mean
91  * something is still "busy."
92  *
93  * ONLY the caller that adds the family and the events ever has a direct
94  * reference to the internal structures and thus ONLY it should be doing
95  * the removal of either the event or family.  In practise, what this means
96  * is that in ip_netinfo.c, we have calls to net_protocol_register(), followed
97  * by net_event_register() (these interface to hook_family_add() and
98  * hook_event_add(), respectively) that are made when we create an instance
99  * of IP and when the IP instance is shutdown/destroyed, it calls
100  * net_event_unregister() and net_protocol_unregister(), which in turn call
101  * hook_event_remove() and hook_family_remove() respectively. Nobody else
102  * is entitled to call the _unregister() functions.  It is imperative that
103  * there be only one _remove() call for every _add() call.
104  *
105  * It is possible that code which is interfacing with this hook framework
106  * won't do all the cleaning up that it needs to at the right time. While
107  * we can't prevent programmers from creating memory leaks, we can synchronise
108  * when we clean up data structures to prevent code accessing free'd memory.
109  *
110  * A simple diagram showing the ownership is as follows:
111  *
112  *  Owned       +--------------+
113  *   by         | hook_stack_t |
114  *   the        +--------------+
115  *  Instance      |
116  * - - - - - - - -|- - - - - - - - - - - - - - - - - -
117  *                V
118  *  Owned       +-------------------+     +-------------------+
119  *              | hook_family_int_t |---->| hook_family_int_t |
120  *   by         +-------------------+     +-------------------+
121  *                | \+---------------+        \+---------------+
122  *  network       |  | hook_family_t |         | hook_family_t |
123  *                V  +---------------+         +---------------+
124  *  protocol   +------------------+     +------------------+
125  *             | hook_event_int_t |---->| hook_event_int_t |
126  * (ipv4,ipv6) +------------------+     +------------------+
127  *                | \+--------------+        \+--------------+
128  *                |  | hook_event_t |         | hook_event_t |
129  *                |  +--------------+         +--------------+
130  * - - - - - - - -|- - - - - - - - - - - - - - - - - -
131  *                V
132  *  Owned      +------------+
133  *             | hook_int_t |
134  *   by        +------------+
135  *                  \+--------+
136  * the consumer      | hook_t |
137  *                   +--------+
138  *
139  * The consumers, such as IPFilter, do not have any pointers or hold any
140  * references to hook_int_t, hook_event_t or hook_event_int_t. By placing
141  * a hook on an event through net_hook_register(), an implicit reference
142  * to the hook_event_int_t is returned with a successful call.  Additionally,
143  * IPFilter does not see the hook_family_int_t or hook_family_t directly.
144  * Rather it is returned a net_handle_t (from net_protocol_lookup()) that
145  * contains a pointer to hook_family_int_t.  The structure behind the
146  * net_handle_t (struct net_data) *is* reference counted and managed
147  * appropriately.
148  *
149  * A more detailed picture that describes how the family/event structures
150  * are linked together can be found in <sys/hook_impl.h>
151  *
152  * Notification callbacks.
153  * =======================
154  * For each of the hook stack, hook family and hook event, it is possible
155  * to request notificatin of change to them. Why?
156  * First, lets equate the hook stack to an IP instance, a hook family to
157  * a network protocol and a hook event to IP packets on the input path.
158  * If a kernel module wants to apply security from the very start of
159  * things, it needs to know as soon as a new instance of networking
160  * is initiated. Whilst for the global zone, it is taken for granted that
161  * this instance will always exist before any interaction takes place,
162  * that is not true for zones running with an exclusive networking instance.
163  * Thus when a local zone is started and a new instance is created to support
164  * that, parties that wish to monitor it and apply a security policy from
165  * the onset need to be informed as early as possible - quite probably
166  * before any networking is started by the zone's boot scripts.
167  * Inside each instance, it is possible to have a number of network protocols
168  * (hook families) in operation. Inside the context of the global zone,
169  * it is possible to have code run before the kernel module providing the
170  * IP networking is loaded. From here, to apply the appropriate security,
171  * it is necessary to become informed of when IP is being configured into
172  * the zone and this is done by registering a notification callback with
173  * the hook stack for changes to it. The next step is to know when packets
174  * can be received through the physical_in, etc, events. This is achieved
175  * by registering a callback with the appropriate network protocol (or in
176  * this file, the correct hook family.) Thus when IP finally attaches a
177  * physical_in event to inet, the module looking to enforce a security
178  * policy can become aware of it being present. Of course there's no
179  * requirement for such a module to be present before all of the above
180  * happens and in such a case, it is reasonable for the same module to
181  * work after everything has been put in place. For this reason, when
182  * a notification callback is added, a series of fake callback events
183  * is generated to simulate the arrival of those entities. There is one
184  * final series of callbacks that can be registered - those to monitor
185  * actual hooks that are added or removed from an event. In practice,
186  * this is useful when there are multiple kernel modules participating
187  * in the processing of packets and there are behaviour dependencies
188  * involved, such that one kernel module might only register its hook
189  * if another is already present and also might want to remove its hook
190  * when the other disappears.
191  *
192  * If you know a kernel module will not be loaded before the infrastructure
193  * used in this file is present then it is not necessary to use this
194  * notification callback mechanism.
195  */
196 
197 /*
198  * Locking
199  * =======
200  * The use of CVW_* macros to do locking is driven by the need to allow
201  * recursive locking with read locks when we're processing packets. This
202  * is necessary because various netinfo functions need to hold read locks,
203  * by design, as they can be called in or out of packet context.
204  */
205 /*
206  * Hook internal functions
207  */
208 static hook_int_t *hook_copy(hook_t *src);
209 static hook_event_int_t *hook_event_checkdup(hook_event_t *he,
210     hook_stack_t *hks);
211 static hook_event_int_t *hook_event_copy(hook_event_t *src);
212 static hook_event_int_t *hook_event_find(hook_family_int_t *hfi, char *event);
213 static void hook_event_free(hook_event_int_t *hei, hook_family_int_t *hfi);
214 static hook_family_int_t *hook_family_copy(hook_family_t *src);
215 static hook_family_int_t *hook_family_find(char *family, hook_stack_t *hks);
216 static void hook_family_free(hook_family_int_t *hfi, hook_stack_t *hks);
217 static hook_int_t *hook_find(hook_event_int_t *hei, hook_t *h);
218 static void hook_int_free(hook_int_t *hi, netstackid_t);
219 static void hook_init(void);
220 static void hook_fini(void);
221 static void *hook_stack_init(netstackid_t stackid, netstack_t *ns);
222 static void hook_stack_fini(netstackid_t stackid, void *arg);
223 static void hook_stack_shutdown(netstackid_t stackid, void *arg);
224 static int hook_insert(hook_int_head_t *head, hook_int_t *new);
225 static void hook_insert_plain(hook_int_head_t *head, hook_int_t *new);
226 static int hook_insert_afterbefore(hook_int_head_t *head, hook_int_t *new);
227 static hook_int_t *hook_find_byname(hook_int_head_t *head, char *name);
228 static void hook_event_init_kstats(hook_family_int_t *, hook_event_int_t *);
229 static void hook_event_notify_run(hook_event_int_t *, hook_family_int_t *,
230     char *event, char *name, hook_notify_cmd_t cmd);
231 static void hook_init_kstats(hook_family_int_t *hfi, hook_event_int_t *hei,
232     hook_int_t *hi);
233 static int hook_notify_register(hook_notify_head_t *head,
234     hook_notify_fn_t callback, void *arg);
235 static int hook_notify_unregister(hook_notify_head_t *head,
236     hook_notify_fn_t callback, void **);
237 static void hook_notify_run(hook_notify_head_t *head, char *family,
238     char *event, char *name, hook_notify_cmd_t cmd);
239 static void hook_stack_notify_run(hook_stack_t *hks, char *name,
240     hook_notify_cmd_t cmd);
241 static void hook_stack_remove(hook_stack_t *hks);
242 
243 /*
244  * A list of the hook stacks is kept here because we need to enable
245  * net_instance_notify_register() to be called during the creation
246  * of a new instance. Previously hook_stack_get() would just use
247  * the netstack functions for this work but they will return NULL
248  * until the zone has been fully initialised.
249  */
250 static hook_stack_head_t hook_stacks;
251 static kmutex_t hook_stack_lock;
252 
253 /*
254  * Module entry points.
255  */
256 int
257 _init(void)
258 {
259 	int error;
260 
261 	hook_init();
262 	error = mod_install(&modlinkage);
263 	if (error != 0)
264 		hook_fini();
265 
266 	return (error);
267 }
268 
269 int
270 _fini(void)
271 {
272 	int error;
273 
274 	error = mod_remove(&modlinkage);
275 	if (error == 0)
276 		hook_fini();
277 
278 	return (error);
279 }
280 
281 int
282 _info(struct modinfo *modinfop)
283 {
284 	return (mod_info(&modlinkage, modinfop));
285 }
286 
287 /*
288  * Function:	hook_init
289  * Returns:	None
290  * Parameters:	None
291  *
292  * Initialize hooks
293  */
294 static void
295 hook_init(void)
296 {
297 	mutex_init(&hook_stack_lock, NULL, MUTEX_DRIVER, NULL);
298 	SLIST_INIT(&hook_stacks);
299 
300 	/*
301 	 * We want to be informed each time a stack is created or
302 	 * destroyed in the kernel.
303 	 */
304 	netstack_register(NS_HOOK, hook_stack_init, hook_stack_shutdown,
305 	    hook_stack_fini);
306 }
307 
308 /*
309  * Function:	hook_fini
310  * Returns:	None
311  * Parameters:	None
312  *
313  * Deinitialize hooks
314  */
315 static void
316 hook_fini(void)
317 {
318 	netstack_unregister(NS_HOOK);
319 
320 	mutex_destroy(&hook_stack_lock);
321 	ASSERT(SLIST_EMPTY(&hook_stacks));
322 }
323 
324 /*
325  * Function:	hook_wait_setflag
326  * Returns:     -1 = setting flag is disallowed, 0 = flag set and did
327  *              not have to wait (ie no lock droped), 1 = flag set but
328  *              it was necessary to drop locks to set it.
329  * Parameters:  waiter(I)  - control data structure
330  *              busyset(I) - set of flags that we don't want set while
331  *                           we are active.
332  *              wanted(I)  - flag associated with newflag to indicate
333  *                           what we want to do.
334  *              newflag(I) - the new ACTIVE flag we want to set that
335  *                           indicates what we are doing.
336  *
337  * The set of functions hook_wait_* implement an API that builds on top of
338  * the kcondvar_t to provide controlled execution through a critical region.
339  * For each flag that indicates work is being done (FWF_*_ACTIVE) there is
340  * also a flag that we set to indicate that we want to do it (FWF_*_WANTED).
341  * The combination of flags is required as when this function exits to do
342  * the task, the structure is then free for another caller to use and
343  * to indicate that it wants to do work.  The flags used when a caller wants
344  * to destroy an object take precedence over those that are used for making
345  * changes to it (add/remove.) In this case, we don't try to secure the
346  * ability to run and return with an error.
347  *
348  * "wantedset" is used here to determine who has the right to clear the
349  * wanted bit from the fw_flags set: only whomever sets the flag has the
350  * right to clear it at the bottom of the loop, even if someone else
351  * wants to set it.
352  *
353  * wanted - the FWF_*_WANTED flag that describes the action being requested
354  * busyset- the set of FWF_* flags we don't want set when we run
355  * newflag- the FWF_*_ACTIVE flag we will set to indicate we are busy
356  */
357 int
358 hook_wait_setflag(flagwait_t *waiter, uint32_t busyset, fwflag_t wanted,
359     fwflag_t newflag)
360 {
361 	boolean_t wantedset;
362 	int waited = 0;
363 
364 	mutex_enter(&waiter->fw_lock);
365 	if (waiter->fw_flags & FWF_DESTROY) {
366 		cv_signal(&waiter->fw_cv);
367 		mutex_exit(&waiter->fw_lock);
368 		return (-1);
369 	}
370 	while (waiter->fw_flags & busyset) {
371 		wantedset = ((waiter->fw_flags & wanted) == wanted);
372 		if (!wantedset)
373 			waiter->fw_flags |= wanted;
374 		CVW_EXIT_WRITE(waiter->fw_owner);
375 		cv_wait(&waiter->fw_cv, &waiter->fw_lock);
376 		/*
377 		 * This lock needs to be dropped here to preserve the order
378 		 * of acquisition that is fw_owner followed by fw_lock, else
379 		 * we can deadlock.
380 		 */
381 		mutex_exit(&waiter->fw_lock);
382 		waited = 1;
383 		CVW_ENTER_WRITE(waiter->fw_owner);
384 		mutex_enter(&waiter->fw_lock);
385 		if (!wantedset)
386 			waiter->fw_flags &= ~wanted;
387 		if (waiter->fw_flags & FWF_DESTROY) {
388 			cv_signal(&waiter->fw_cv);
389 			mutex_exit(&waiter->fw_lock);
390 			return (-1);
391 		}
392 	}
393 	waiter->fw_flags &= ~wanted;
394 	ASSERT((waiter->fw_flags & wanted) == 0);
395 	ASSERT((waiter->fw_flags & newflag) == 0);
396 	waiter->fw_flags |= newflag;
397 	mutex_exit(&waiter->fw_lock);
398 	return (waited);
399 }
400 
401 /*
402  * Function:	hook_wait_unsetflag
403  * Returns:     None
404  * Parameters:  waiter(I)  - control data structure
405  *              oldflag(I) - flag to reset
406  *
407  * Turn off the bit that we had set to run and let others know that
408  * they should now check to see if they can run.
409  */
410 void
411 hook_wait_unsetflag(flagwait_t *waiter, fwflag_t oldflag)
412 {
413 	mutex_enter(&waiter->fw_lock);
414 	waiter->fw_flags &= ~oldflag;
415 	cv_signal(&waiter->fw_cv);
416 	mutex_exit(&waiter->fw_lock);
417 }
418 
419 /*
420  * Function:	hook_wait_destroy
421  * Returns:     None
422  * Parameters:  waiter(I)  - control data structure
423  *
424  * Since outer locking (on fw_owner) should ensure that only one function
425  * at a time gets to call hook_wait_destroy() on a given object, there is
426  * no need to guard against setting FWF_DESTROY_WANTED already being set.
427  * It is, however, necessary to wait for all activity on the owning
428  * structure to cease.
429  */
430 int
431 hook_wait_destroy(flagwait_t *waiter)
432 {
433 	ASSERT((waiter->fw_flags & FWF_DESTROY_WANTED) == 0);
434 	mutex_enter(&waiter->fw_lock);
435 	if (waiter->fw_flags & FWF_DESTROY_WANTED) {
436 		cv_signal(&waiter->fw_cv);
437 		mutex_exit(&waiter->fw_lock);
438 		return (EINPROGRESS);
439 	}
440 	waiter->fw_flags |= FWF_DESTROY_WANTED;
441 	while (!FWF_DESTROY_OK(waiter)) {
442 		CVW_EXIT_WRITE(waiter->fw_owner);
443 		cv_wait(&waiter->fw_cv, &waiter->fw_lock);
444 		CVW_ENTER_WRITE(waiter->fw_owner);
445 	}
446 	/*
447 	 * There should now be nothing else using "waiter" or its
448 	 * owner, so we can safely assign here without risk of wiiping
449 	 * out someone's bit.
450 	 */
451 	waiter->fw_flags = FWF_DESTROY_ACTIVE;
452 	cv_signal(&waiter->fw_cv);
453 	mutex_exit(&waiter->fw_lock);
454 
455 	return (0);
456 }
457 
458 /*
459  * Function:	hook_wait_init
460  * Returns:     None
461  * Parameters:  waiter(I)  - control data structure
462  *              ownder(I)  - pointer to lock that the owner of this
463  *                           waiter uses
464  *
465  * "owner" gets passed in here so that when we need to call cv_wait,
466  * for example in hook_wait_setflag(), we can drop the lock for the
467  * next layer out, which is likely to be held in an exclusive manner.
468  */
469 void
470 hook_wait_init(flagwait_t *waiter, cvwaitlock_t *owner)
471 {
472 	cv_init(&waiter->fw_cv, NULL, CV_DRIVER, NULL);
473 	mutex_init(&waiter->fw_lock, NULL, MUTEX_DRIVER, NULL);
474 	waiter->fw_flags = FWF_NONE;
475 	waiter->fw_owner = owner;
476 }
477 
478 /*
479  * Function:	hook_stack_init
480  * Returns:     void *     - pointer to new hook stack structure
481  * Parameters:  stackid(I) - identifier for the network instance that owns this
482  *              ns(I)      - pointer to the network instance data structure
483  *
484  * Allocate and initialize the hook stack instance. This function is not
485  * allowed to fail, so KM_SLEEP is used here when allocating memory. The
486  * value returned is passed back into the shutdown and destroy hooks.
487  */
488 /*ARGSUSED*/
489 static void *
490 hook_stack_init(netstackid_t stackid, netstack_t *ns)
491 {
492 	hook_stack_t	*hks;
493 
494 #ifdef NS_DEBUG
495 	printf("hook_stack_init(stack %d)\n", stackid);
496 #endif
497 
498 	hks = (hook_stack_t *)kmem_zalloc(sizeof (*hks), KM_SLEEP);
499 	hks->hks_netstack = ns;
500 	hks->hks_netstackid = stackid;
501 
502 	CVW_INIT(&hks->hks_lock);
503 	TAILQ_INIT(&hks->hks_nhead);
504 	SLIST_INIT(&hks->hks_familylist);
505 
506 	hook_wait_init(&hks->hks_waiter, &hks->hks_lock);
507 
508 	mutex_enter(&hook_stack_lock);
509 	SLIST_INSERT_HEAD(&hook_stacks, hks, hks_entry);
510 	mutex_exit(&hook_stack_lock);
511 
512 	return (hks);
513 }
514 
515 /*
516  * Function:	hook_stack_shutdown
517  * Returns:     void
518  * Parameters:  stackid(I) - identifier for the network instance that owns this
519  *              arg(I)     - pointer returned by hook_stack_init
520  *
521  * Set the shutdown flag to indicate that we should stop accepting new
522  * register calls as we're now in the cleanup process. The cleanup is a
523  * two stage process and we're not required to free any memory here.
524  *
525  * The curious would wonder why isn't there any code that walks through
526  * all of the data structures and sets the flag(s) there? The answer is
527  * that it is expected that this will happen when the zone shutdown calls
528  * the shutdown callbacks for other modules that they will initiate the
529  * free'ing and shutdown of the hooks themselves.
530  */
531 /*ARGSUSED*/
532 static void
533 hook_stack_shutdown(netstackid_t stackid, void *arg)
534 {
535 	hook_stack_t *hks = (hook_stack_t *)arg;
536 
537 	mutex_enter(&hook_stack_lock);
538 	/*
539 	 * Once this flag gets set to one, no more additions are allowed
540 	 * to any of the structures that make up this stack.
541 	 */
542 	hks->hks_shutdown = 1;
543 	mutex_exit(&hook_stack_lock);
544 }
545 
546 /*
547  * Function:	hook_stack_destroy
548  * Returns:     void
549  * Parameters:  stackid(I) - identifier for the network instance that owns this
550  *              arg(I)     - pointer returned by hook_stack_init
551  *
552  * Free the hook stack instance.
553  *
554  * The rationale for the shutdown being lazy (see the comment above for
555  * hook_stack_shutdown) also applies to the destroy being lazy. Only if
556  * the hook_stack_t data structure is unused will it go away. Else it
557  * is left up to the last user of a data structure to actually free it.
558  */
559 /*ARGSUSED*/
560 static void
561 hook_stack_fini(netstackid_t stackid, void *arg)
562 {
563 	hook_stack_t *hks = (hook_stack_t *)arg;
564 
565 	mutex_enter(&hook_stack_lock);
566 	hks->hks_shutdown = 2;
567 	hook_stack_remove(hks);
568 	mutex_exit(&hook_stack_lock);
569 }
570 
571 /*
572  * Function:	hook_stack_remove
573  * Returns:     void
574  * Parameters:  hks(I) - pointer to an instance of a hook_stack_t
575  *
576  * This function assumes that it is called with hook_stack_lock held.
577  * It functions differently to hook_family/event_remove in that it does
578  * the checks to see if it can be removed. This difference exists
579  * because this structure has nothing higher up that depends on it.
580  */
581 static void
582 hook_stack_remove(hook_stack_t *hks)
583 {
584 
585 	ASSERT(mutex_owned(&hook_stack_lock));
586 
587 	/*
588 	 * Is the structure still in use?
589 	 */
590 	if (!SLIST_EMPTY(&hks->hks_familylist) ||
591 	    !TAILQ_EMPTY(&hks->hks_nhead))
592 		return;
593 
594 	SLIST_REMOVE(&hook_stacks, hks, hook_stack, hks_entry);
595 
596 	VERIFY(hook_wait_destroy(&hks->hks_waiter) == 0);
597 	CVW_DESTROY(&hks->hks_lock);
598 	kmem_free(hks, sizeof (*hks));
599 }
600 
601 /*
602  * Function:	hook_stack_get
603  * Returns:     hook_stack_t * - NULL if not found, else matching instance
604  * Parameters:  stackid(I)     - instance id to search for
605  *
606  * Search the list of currently active hook_stack_t structures for one that
607  * has a matching netstackid_t to the value passed in. The linked list can
608  * only ever have at most one match for this value.
609  */
610 static hook_stack_t *
611 hook_stack_get(netstackid_t stackid)
612 {
613 	hook_stack_t *hks;
614 
615 	SLIST_FOREACH(hks, &hook_stacks, hks_entry) {
616 		if (hks->hks_netstackid == stackid)
617 			break;
618 	}
619 
620 	return (hks);
621 }
622 
623 /*
624  * Function:	hook_stack_notify_register
625  * Returns:	int        - 0 = success, else failure
626  * Parameters:	stackid(I) - netstack identifier
627  *              callback(I)- function to be called
628  *              arg(I)     - arg to provide callback when it is called
629  *
630  * If we're not shutting down this instance, append a new function to the
631  * list of those to call when a new family of hooks is added to this stack.
632  * If the function can be successfully added to the list of callbacks
633  * activated when there is a change to the stack (addition or removal of
634  * a hook family) then generate a fake HN_REGISTER event by directly
635  * calling the callback with the relevant information for each hook
636  * family that currently exists (and isn't being shutdown.)
637  */
638 int
639 hook_stack_notify_register(netstackid_t stackid, hook_notify_fn_t callback,
640     void *arg)
641 {
642 	hook_family_int_t *hfi;
643 	hook_stack_t *hks;
644 	boolean_t canrun;
645 	char buffer[16];
646 	int error;
647 
648 	ASSERT(callback != NULL);
649 
650 	canrun = B_FALSE;
651 	mutex_enter(&hook_stack_lock);
652 	hks = hook_stack_get(stackid);
653 	if (hks != NULL) {
654 		if (hks->hks_shutdown != 0) {
655 			error = ESHUTDOWN;
656 		} else {
657 			CVW_ENTER_WRITE(&hks->hks_lock);
658 			canrun = (hook_wait_setflag(&hks->hks_waiter,
659 			    FWF_ADD_WAIT_MASK, FWF_ADD_WANTED,
660 			    FWF_ADD_ACTIVE) != -1);
661 			error = hook_notify_register(&hks->hks_nhead,
662 			    callback, arg);
663 			CVW_EXIT_WRITE(&hks->hks_lock);
664 		}
665 	} else {
666 		error = ESRCH;
667 	}
668 	mutex_exit(&hook_stack_lock);
669 
670 	if (error == 0 && canrun) {
671 		/*
672 		 * Generate fake register event for callback that
673 		 * is being added, letting it know everything that
674 		 * already exists.
675 		 */
676 		(void) snprintf(buffer, sizeof (buffer), "%u",
677 		    hks->hks_netstackid);
678 
679 		SLIST_FOREACH(hfi, &hks->hks_familylist, hfi_entry) {
680 			if (hfi->hfi_condemned || hfi->hfi_shutdown)
681 				continue;
682 			callback(HN_REGISTER, arg, buffer, NULL,
683 			    hfi->hfi_family.hf_name);
684 		}
685 	}
686 
687 	if (canrun)
688 		hook_wait_unsetflag(&hks->hks_waiter, FWF_ADD_ACTIVE);
689 
690 	return (error);
691 }
692 
693 /*
694  * Function:	hook_stack_notify_unregister
695  * Returns:	int         - 0 = success, else failure
696  * Parameters:	stackid(I)  - netstack identifier
697  *              callback(I) - function to be called
698  *
699  * Attempt to remove a registered function from a hook stack's list of
700  * callbacks to activiate when protocols are added/deleted.
701  * As with hook_stack_notify_register, if all things are going well then
702  * a fake unregister event is delivered to the callback being removed
703  * for each hook family that presently exists.
704  */
705 int
706 hook_stack_notify_unregister(netstackid_t stackid, hook_notify_fn_t callback)
707 {
708 	hook_family_int_t *hfi;
709 	hook_stack_t *hks;
710 	char buffer[16];
711 	void *arg;
712 	int error;
713 
714 	mutex_enter(&hook_stack_lock);
715 	hks = hook_stack_get(stackid);
716 	if (hks == NULL) {
717 		mutex_exit(&hook_stack_lock);
718 		return (ESRCH);
719 	}
720 
721 	CVW_ENTER_WRITE(&hks->hks_lock);
722 	/*
723 	 * If hook_wait_setflag returns -1, another thread has flagged that it
724 	 * is attempting to destroy this hook stack.  Before it can flag that
725 	 * it's destroying the hook stack, it must first verify (with
726 	 * hook_stack_lock held) that the hook stack is empty.  If we
727 	 * encounter this, it means we should have nothing to do and we
728 	 * just snuck in.
729 	 */
730 	if (hook_wait_setflag(&hks->hks_waiter, FWF_DEL_WAIT_MASK,
731 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
732 		VERIFY(TAILQ_EMPTY(&hks->hks_nhead));
733 		CVW_EXIT_WRITE(&hks->hks_lock);
734 		mutex_exit(&hook_stack_lock);
735 		return (ESRCH);
736 	}
737 
738 	error = hook_notify_unregister(&hks->hks_nhead, callback, &arg);
739 	CVW_EXIT_WRITE(&hks->hks_lock);
740 	mutex_exit(&hook_stack_lock);
741 
742 	if (error == 0) {
743 		/*
744 		 * Generate fake unregister event for callback that
745 		 * is being removed, letting it know everything that
746 		 * currently exists is now "disappearing."
747 		 */
748 		(void) snprintf(buffer, sizeof (buffer), "%u",
749 		    hks->hks_netstackid);
750 
751 		SLIST_FOREACH(hfi, &hks->hks_familylist, hfi_entry) {
752 			callback(HN_UNREGISTER, arg, buffer, NULL,
753 			    hfi->hfi_family.hf_name);
754 		}
755 	} else {
756 		/*
757 		 * hook_notify_unregister() should only fail if the callback has
758 		 * already been deleted (ESRCH).
759 		 */
760 		VERIFY3S(error, ==, ESRCH);
761 	}
762 
763 	mutex_enter(&hook_stack_lock);
764 	hook_wait_unsetflag(&hks->hks_waiter, FWF_DEL_ACTIVE);
765 	if (hks->hks_shutdown == 2)
766 		hook_stack_remove(hks);
767 	mutex_exit(&hook_stack_lock);
768 
769 	return (error);
770 }
771 
772 /*
773  * Function:	hook_stack_notify_run
774  * Returns:	None
775  * Parameters:	hks(I)  - hook stack pointer to execute callbacks for
776  *              name(I) - name of a hook family
777  *              cmd(I)  - either HN_UNREGISTER or HN_REGISTER
778  *
779  * Run through the list of callbacks on the hook stack to be called when
780  * a new hook family is added
781  *
782  * As hook_notify_run() expects 3 names, one for the family that is associated
783  * with the cmd (HN_REGISTER or HN_UNREGISTER), one for the event and one
784  * for the object being introduced and we really only have one name (that
785  * of the new hook family), fake the hook stack's name by converting the
786  * integer to a string and for the event just pass NULL.
787  */
788 static void
789 hook_stack_notify_run(hook_stack_t *hks, char *name,
790     hook_notify_cmd_t cmd)
791 {
792 	char buffer[16];
793 
794 	ASSERT(hks != NULL);
795 	ASSERT(name != NULL);
796 
797 	(void) snprintf(buffer, sizeof (buffer), "%u", hks->hks_netstackid);
798 
799 	hook_notify_run(&hks->hks_nhead, buffer, NULL, name, cmd);
800 }
801 
802 /*
803  * Function:	hook_run
804  * Returns:	int      - return value according to callback func
805  * Parameters:	token(I) - event pointer
806  *		info(I)  - message
807  *
808  * Run hooks for specific provider.  The hooks registered are stepped through
809  * until either the end of the list is reached or a hook function returns a
810  * non-zero value.  If a non-zero value is returned from a hook function, we
811  * return that value back to our caller.  By design, a hook function can be
812  * called more than once, simultaneously.
813  */
814 int
815 hook_run(hook_family_int_t *hfi, hook_event_token_t token, hook_data_t info)
816 {
817 	hook_event_int_t *hei;
818 	hook_int_t *hi;
819 	int rval = 0;
820 
821 	ASSERT(token != NULL);
822 
823 	hei = (hook_event_int_t *)token;
824 	DTRACE_PROBE2(hook__run__start,
825 	    hook_event_token_t, token,
826 	    hook_data_t, info);
827 
828 	/*
829 	 * If we consider that this function is only called from within the
830 	 * stack while an instance is currently active,
831 	 */
832 	CVW_ENTER_READ(&hfi->hfi_lock);
833 
834 	TAILQ_FOREACH(hi, &hei->hei_head, hi_entry) {
835 		ASSERT(hi->hi_hook.h_func != NULL);
836 		DTRACE_PROBE3(hook__func__start,
837 		    hook_event_token_t, token,
838 		    hook_data_t, info,
839 		    hook_int_t *, hi);
840 		rval = (*hi->hi_hook.h_func)(token, info, hi->hi_hook.h_arg);
841 		DTRACE_PROBE4(hook__func__end,
842 		    hook_event_token_t, token,
843 		    hook_data_t, info,
844 		    hook_int_t *, hi,
845 		    int, rval);
846 		hi->hi_kstats.hook_hits.value.ui64++;
847 		if (rval != 0)
848 			break;
849 	}
850 
851 	hei->hei_kstats.events.value.ui64++;
852 
853 	CVW_EXIT_READ(&hfi->hfi_lock);
854 
855 	DTRACE_PROBE3(hook__run__end,
856 	    hook_event_token_t, token,
857 	    hook_data_t, info,
858 	    hook_int_t *, hi);
859 
860 	return (rval);
861 }
862 
863 /*
864  * Function:	hook_family_add
865  * Returns:	internal family pointer - NULL = Fail
866  * Parameters:	hf(I)    - family pointer
867  *              hks(I)   - pointer to an instance of a hook_stack_t
868  *              store(O) - where returned pointer will be stored
869  *
870  * Add new family to the family list. The requirements for the addition to
871  * succeed are that the family name must not already be registered and that
872  * the hook stack is not being shutdown.
873  * If store is non-NULL, it is expected to be a pointer to the same variable
874  * that is awaiting to be assigned the return value of this function.
875  * In its current use, the returned value is assigned to netd_hooks in
876  * net_family_register. The use of "store" allows the return value to be
877  * used before this function returns. How can this happen? Through the
878  * callbacks that can be activated at the bottom of this function, when
879  * hook_stack_notify_run is called.
880  */
881 hook_family_int_t *
882 hook_family_add(hook_family_t *hf, hook_stack_t *hks, void **store)
883 {
884 	hook_family_int_t *hfi, *new;
885 
886 	ASSERT(hf != NULL);
887 	ASSERT(hf->hf_name != NULL);
888 
889 	new = hook_family_copy(hf);
890 	if (new == NULL)
891 		return (NULL);
892 
893 	mutex_enter(&hook_stack_lock);
894 	CVW_ENTER_WRITE(&hks->hks_lock);
895 
896 	if (hks->hks_shutdown != 0) {
897 		CVW_EXIT_WRITE(&hks->hks_lock);
898 		mutex_exit(&hook_stack_lock);
899 		hook_family_free(new, NULL);
900 		return (NULL);
901 	}
902 
903 	/* search family list */
904 	hfi = hook_family_find(hf->hf_name, hks);
905 	if (hfi != NULL) {
906 		CVW_EXIT_WRITE(&hks->hks_lock);
907 		mutex_exit(&hook_stack_lock);
908 		hook_family_free(new, NULL);
909 		return (NULL);
910 	}
911 
912 	/*
913 	 * Try and set the FWF_ADD_ACTIVE flag so that we can drop all the
914 	 * lock further down when calling all of the functions registered
915 	 * for notification when a new hook family is added.
916 	 */
917 	if (hook_wait_setflag(&hks->hks_waiter, FWF_ADD_WAIT_MASK,
918 	    FWF_ADD_WANTED, FWF_ADD_ACTIVE) == -1) {
919 		CVW_EXIT_WRITE(&hks->hks_lock);
920 		mutex_exit(&hook_stack_lock);
921 		hook_family_free(new, NULL);
922 		return (NULL);
923 	}
924 
925 	CVW_INIT(&new->hfi_lock);
926 	SLIST_INIT(&new->hfi_head);
927 	TAILQ_INIT(&new->hfi_nhead);
928 
929 	hook_wait_init(&new->hfi_waiter, &new->hfi_lock);
930 
931 	new->hfi_stack = hks;
932 	if (store != NULL)
933 		*store = new;
934 
935 	/* Add to family list head */
936 	SLIST_INSERT_HEAD(&hks->hks_familylist, new, hfi_entry);
937 
938 	CVW_EXIT_WRITE(&hks->hks_lock);
939 	mutex_exit(&hook_stack_lock);
940 
941 	hook_stack_notify_run(hks, hf->hf_name, HN_REGISTER);
942 
943 	hook_wait_unsetflag(&hks->hks_waiter, FWF_ADD_ACTIVE);
944 
945 	return (new);
946 }
947 
948 /*
949  * Function:	hook_family_remove
950  * Returns:	int    - 0 = success, else = failure
951  * Parameters:	hfi(I) - internal family pointer
952  *
953  * Remove family from family list. This function has been designed to be
954  * called once and once only per hook_family_int_t. Thus when cleaning up
955  * this structure as an orphan, callers should only call hook_family_free.
956  */
957 int
958 hook_family_remove(hook_family_int_t *hfi)
959 {
960 	hook_stack_t *hks;
961 	boolean_t notifydone;
962 
963 	ASSERT(hfi != NULL);
964 	hks = hfi->hfi_stack;
965 
966 	CVW_ENTER_WRITE(&hfi->hfi_lock);
967 	notifydone = hfi->hfi_shutdown;
968 	hfi->hfi_shutdown = B_TRUE;
969 	CVW_EXIT_WRITE(&hfi->hfi_lock);
970 
971 	CVW_ENTER_WRITE(&hks->hks_lock);
972 
973 	if (hook_wait_setflag(&hks->hks_waiter, FWF_DEL_WAIT_MASK,
974 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
975 		/*
976 		 * If we're trying to destroy the hook_stack_t...
977 		 */
978 		CVW_EXIT_WRITE(&hks->hks_lock);
979 		return (ENXIO);
980 	}
981 
982 	/*
983 	 * Check if the family is in use by the presence of either events
984 	 * or notify callbacks on the hook family.
985 	 */
986 	if (!SLIST_EMPTY(&hfi->hfi_head) || !TAILQ_EMPTY(&hfi->hfi_nhead)) {
987 		hfi->hfi_condemned = B_TRUE;
988 	} else {
989 		VERIFY(hook_wait_destroy(&hfi->hfi_waiter) == 0);
990 		/*
991 		 * Although hfi_condemned = B_FALSE is implied from creation,
992 		 * putting a comment here inside the else upsets lint.
993 		 */
994 		hfi->hfi_condemned = B_FALSE;
995 	}
996 	CVW_EXIT_WRITE(&hks->hks_lock);
997 
998 	if (!notifydone)
999 		hook_stack_notify_run(hks, hfi->hfi_family.hf_name,
1000 		    HN_UNREGISTER);
1001 
1002 	hook_wait_unsetflag(&hks->hks_waiter, FWF_DEL_ACTIVE);
1003 
1004 	/*
1005 	 * If we don't have to wait for anything else to disappear from this
1006 	 * structure then we can free it up.
1007 	 */
1008 	if (!hfi->hfi_condemned)
1009 		hook_family_free(hfi, hks);
1010 
1011 	return (0);
1012 }
1013 
1014 
1015 /*
1016  * Function:	hook_family_free
1017  * Returns:	None
1018  * Parameters:	hfi(I) - internal family pointer
1019  *
1020  * Free alloc memory for family
1021  */
1022 static void
1023 hook_family_free(hook_family_int_t *hfi, hook_stack_t *hks)
1024 {
1025 
1026 	/*
1027 	 * This lock gives us possession of the hks pointer after the
1028 	 * SLIST_REMOVE, for which it is not needed, when hks_shutdown
1029 	 * is checked and hook_stack_remove called.
1030 	 */
1031 	mutex_enter(&hook_stack_lock);
1032 
1033 	ASSERT(hfi != NULL);
1034 
1035 	if (hks != NULL) {
1036 		CVW_ENTER_WRITE(&hks->hks_lock);
1037 		/* Remove from family list */
1038 		SLIST_REMOVE(&hks->hks_familylist, hfi, hook_family_int,
1039 		    hfi_entry);
1040 
1041 		CVW_EXIT_WRITE(&hks->hks_lock);
1042 	}
1043 
1044 	/* Free name space */
1045 	if (hfi->hfi_family.hf_name != NULL) {
1046 		kmem_free(hfi->hfi_family.hf_name,
1047 		    strlen(hfi->hfi_family.hf_name) + 1);
1048 	}
1049 
1050 	/* Free container */
1051 	kmem_free(hfi, sizeof (*hfi));
1052 
1053 	if (hks->hks_shutdown == 2)
1054 		hook_stack_remove(hks);
1055 
1056 	mutex_exit(&hook_stack_lock);
1057 }
1058 
1059 /*
1060  * Function:	hook_family_shutdown
1061  * Returns:	int    - 0 = success, else = failure
1062  * Parameters:	hfi(I) - internal family pointer
1063  *
1064  * As an alternative to removing a family, we may desire to just generate
1065  * a series of callbacks to indicate that we will be going away in the
1066  * future. The hfi_condemned flag isn't set because we aren't trying to
1067  * remove the structure.
1068  */
1069 int
1070 hook_family_shutdown(hook_family_int_t *hfi)
1071 {
1072 	hook_stack_t *hks;
1073 	boolean_t notifydone;
1074 
1075 	ASSERT(hfi != NULL);
1076 	hks = hfi->hfi_stack;
1077 
1078 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1079 	notifydone = hfi->hfi_shutdown;
1080 	hfi->hfi_shutdown = B_TRUE;
1081 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1082 
1083 	CVW_ENTER_WRITE(&hks->hks_lock);
1084 
1085 	if (hook_wait_setflag(&hks->hks_waiter, FWF_DEL_WAIT_MASK,
1086 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
1087 		/*
1088 		 * If we're trying to destroy the hook_stack_t...
1089 		 */
1090 		CVW_EXIT_WRITE(&hks->hks_lock);
1091 		return (ENXIO);
1092 	}
1093 
1094 	CVW_EXIT_WRITE(&hks->hks_lock);
1095 
1096 	if (!notifydone)
1097 		hook_stack_notify_run(hks, hfi->hfi_family.hf_name,
1098 		    HN_UNREGISTER);
1099 
1100 	hook_wait_unsetflag(&hks->hks_waiter, FWF_DEL_ACTIVE);
1101 
1102 	return (0);
1103 }
1104 
1105 /*
1106  * Function:	hook_family_copy
1107  * Returns:	internal family pointer - NULL = Failed
1108  * Parameters:	src(I) - family pointer
1109  *
1110  * Allocate internal family block and duplicate incoming family
1111  * No locks should be held across this function as it may sleep.
1112  */
1113 static hook_family_int_t *
1114 hook_family_copy(hook_family_t *src)
1115 {
1116 	hook_family_int_t *new;
1117 	hook_family_t *dst;
1118 
1119 	ASSERT(src != NULL);
1120 	ASSERT(src->hf_name != NULL);
1121 
1122 	new = (hook_family_int_t *)kmem_zalloc(sizeof (*new), KM_SLEEP);
1123 
1124 	/* Copy body */
1125 	dst = &new->hfi_family;
1126 	*dst = *src;
1127 
1128 	SLIST_INIT(&new->hfi_head);
1129 	TAILQ_INIT(&new->hfi_nhead);
1130 
1131 	/* Copy name */
1132 	dst->hf_name = (char *)kmem_alloc(strlen(src->hf_name) + 1, KM_SLEEP);
1133 	(void) strcpy(dst->hf_name, src->hf_name);
1134 
1135 	return (new);
1136 }
1137 
1138 /*
1139  * Function:	hook_family_find
1140  * Returns:	internal family pointer - NULL = Not match
1141  * Parameters:	family(I) - family name string
1142  *
1143  * Search family list with family name
1144  *	A lock on hfi_lock must be held when called.
1145  */
1146 static hook_family_int_t *
1147 hook_family_find(char *family, hook_stack_t *hks)
1148 {
1149 	hook_family_int_t *hfi = NULL;
1150 
1151 	ASSERT(family != NULL);
1152 
1153 	SLIST_FOREACH(hfi, &hks->hks_familylist, hfi_entry) {
1154 		if (strcmp(hfi->hfi_family.hf_name, family) == 0)
1155 			break;
1156 	}
1157 	return (hfi);
1158 }
1159 
1160 /*
1161  * Function:	hook_family_notify_register
1162  * Returns:	int         - 0 = success, else failure
1163  * Parameters:	hfi(I)      - hook family
1164  *              callback(I) - function to be called
1165  *              arg(I)      - arg to provide callback when it is called
1166  *
1167  * So long as this hook stack isn't being shut down, register a new
1168  * callback to be activated each time a new event is added to this
1169  * family.
1170  *
1171  * To call this function we must have an active handle in use on the family,
1172  * so if we take this into account, then neither the hook_family_int_t nor
1173  * the hook_stack_t that owns it can disappear. We have to put some trust
1174  * in the callers to be properly synchronised...
1175  *
1176  * Holding hks_lock is required to provide synchronisation for hks_shutdown.
1177  */
1178 int
1179 hook_family_notify_register(hook_family_int_t *hfi,
1180     hook_notify_fn_t callback, void *arg)
1181 {
1182 	hook_event_int_t *hei;
1183 	hook_stack_t *hks;
1184 	boolean_t canrun;
1185 	int error;
1186 
1187 	ASSERT(hfi != NULL);
1188 	canrun = B_FALSE;
1189 	hks = hfi->hfi_stack;
1190 
1191 	CVW_ENTER_READ(&hks->hks_lock);
1192 
1193 	if ((hfi->hfi_stack->hks_shutdown != 0) ||
1194 	    hfi->hfi_condemned || hfi->hfi_shutdown) {
1195 		CVW_EXIT_READ(&hks->hks_lock);
1196 		return (ESHUTDOWN);
1197 	}
1198 
1199 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1200 	canrun = (hook_wait_setflag(&hfi->hfi_waiter, FWF_ADD_WAIT_MASK,
1201 	    FWF_ADD_WANTED, FWF_ADD_ACTIVE) != -1);
1202 	error = hook_notify_register(&hfi->hfi_nhead, callback, arg);
1203 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1204 
1205 	CVW_EXIT_READ(&hks->hks_lock);
1206 
1207 	if (error == 0 && canrun) {
1208 		SLIST_FOREACH(hei, &hfi->hfi_head, hei_entry) {
1209 			callback(HN_REGISTER, arg,
1210 			    hfi->hfi_family.hf_name, NULL,
1211 			    hei->hei_event->he_name);
1212 		}
1213 	}
1214 
1215 	if (canrun)
1216 		hook_wait_unsetflag(&hfi->hfi_waiter, FWF_ADD_ACTIVE);
1217 
1218 	return (error);
1219 }
1220 
1221 /*
1222  * Function:	hook_family_notify_unregister
1223  * Returns:	int         - 0 = success, else failure
1224  * Parameters:	hfi(I)      - hook family
1225  *              callback(I) - function to be called
1226  *
1227  * Remove a callback from the list of those executed when a new event is
1228  * added to a hook family. If the family is not in the process of being
1229  * destroyed then simulate an unregister callback for each event that is
1230  * on the family. This pairs up with the hook_family_notify_register
1231  * action that simulates register events.
1232  * The order of what happens here is important and goes like this.
1233  * 1) Remove the callback from the list of functions to be called as part
1234  *    of the notify operation when an event is added or removed from the
1235  *    hook family.
1236  * 2) If the hook_family_int_t structure is on death row (free_family will
1237  *    be set to true) then there's nothing else to do than let it be free'd.
1238  * 3) If the structure isn't about to die, mark it up as being busy using
1239  *    hook_wait_setflag and then drop the lock so the loop can be run.
1240  * 4) if hook_wait_setflag was successful, tell all of the notify callback
1241  *    functions that this family has been unregistered.
1242  * 5) Cleanup
1243  */
1244 int
1245 hook_family_notify_unregister(hook_family_int_t *hfi,
1246     hook_notify_fn_t callback)
1247 {
1248 	hook_event_int_t *hei;
1249 	boolean_t free_family;
1250 	boolean_t canrun;
1251 	int error;
1252 	void *arg;
1253 
1254 	canrun = B_FALSE;
1255 
1256 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1257 
1258 	(void) hook_wait_setflag(&hfi->hfi_waiter, FWF_DEL_WAIT_MASK,
1259 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE);
1260 
1261 	error = hook_notify_unregister(&hfi->hfi_nhead, callback, &arg);
1262 
1263 	hook_wait_unsetflag(&hfi->hfi_waiter, FWF_DEL_ACTIVE);
1264 
1265 	/*
1266 	 * If hook_family_remove has been called but the structure was still
1267 	 * "busy" ... but we might have just made it "unbusy"...
1268 	 */
1269 	if ((error == 0) && hfi->hfi_condemned &&
1270 	    SLIST_EMPTY(&hfi->hfi_head) && TAILQ_EMPTY(&hfi->hfi_nhead)) {
1271 		free_family = B_TRUE;
1272 	} else {
1273 		free_family = B_FALSE;
1274 	}
1275 
1276 	if (error == 0 && !free_family) {
1277 		canrun = (hook_wait_setflag(&hfi->hfi_waiter, FWF_ADD_WAIT_MASK,
1278 		    FWF_ADD_WANTED, FWF_ADD_ACTIVE) != -1);
1279 	}
1280 
1281 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1282 
1283 	if (canrun) {
1284 		SLIST_FOREACH(hei, &hfi->hfi_head, hei_entry) {
1285 			callback(HN_UNREGISTER, arg,
1286 			    hfi->hfi_family.hf_name, NULL,
1287 			    hei->hei_event->he_name);
1288 		}
1289 
1290 		hook_wait_unsetflag(&hfi->hfi_waiter, FWF_ADD_ACTIVE);
1291 	} else if (free_family) {
1292 		hook_family_free(hfi, hfi->hfi_stack);
1293 	}
1294 
1295 	return (error);
1296 }
1297 
1298 /*
1299  * Function:	hook_event_add
1300  * Returns:	internal event pointer - NULL = Fail
1301  * Parameters:	hfi(I) - internal family pointer
1302  *		he(I)  - event pointer
1303  *
1304  * Add new event to event list on specific family.
1305  * This function can fail to return successfully if (1) it cannot allocate
1306  * enough memory for its own internal data structures, (2) the event has
1307  * already been registered (for any hook family.)
1308  */
1309 hook_event_int_t *
1310 hook_event_add(hook_family_int_t *hfi, hook_event_t *he)
1311 {
1312 	hook_event_int_t *hei, *new;
1313 	hook_stack_t *hks;
1314 
1315 	ASSERT(hfi != NULL);
1316 	ASSERT(he != NULL);
1317 	ASSERT(he->he_name != NULL);
1318 
1319 	new = hook_event_copy(he);
1320 	if (new == NULL)
1321 		return (NULL);
1322 
1323 	hks = hfi->hfi_stack;
1324 	CVW_ENTER_READ(&hks->hks_lock);
1325 
1326 	hks = hfi->hfi_stack;
1327 	if (hks->hks_shutdown != 0) {
1328 		CVW_EXIT_READ(&hks->hks_lock);
1329 		hook_event_free(new, NULL);
1330 		return (NULL);
1331 	}
1332 
1333 	/* Check whether this event pointer is already registered */
1334 	hei = hook_event_checkdup(he, hks);
1335 	if (hei != NULL) {
1336 		CVW_EXIT_READ(&hks->hks_lock);
1337 		hook_event_free(new, NULL);
1338 		return (NULL);
1339 	}
1340 
1341 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1342 
1343 	if (hfi->hfi_condemned || hfi->hfi_shutdown) {
1344 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1345 		CVW_EXIT_READ(&hks->hks_lock);
1346 		hook_event_free(new, NULL);
1347 		return (NULL);
1348 	}
1349 	CVW_EXIT_READ(&hks->hks_lock);
1350 
1351 	if (hook_wait_setflag(&hfi->hfi_waiter, FWF_ADD_WAIT_MASK,
1352 	    FWF_ADD_WANTED, FWF_ADD_ACTIVE) == -1) {
1353 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1354 		hook_event_free(new, NULL);
1355 		return (NULL);
1356 	}
1357 
1358 	TAILQ_INIT(&new->hei_nhead);
1359 
1360 	hook_event_init_kstats(hfi, new);
1361 	hook_wait_init(&new->hei_waiter, &new->hei_lock);
1362 
1363 	/* Add to event list head */
1364 	SLIST_INSERT_HEAD(&hfi->hfi_head, new, hei_entry);
1365 
1366 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1367 
1368 	hook_notify_run(&hfi->hfi_nhead,
1369 	    hfi->hfi_family.hf_name, NULL, he->he_name, HN_REGISTER);
1370 
1371 	hook_wait_unsetflag(&hfi->hfi_waiter, FWF_ADD_ACTIVE);
1372 
1373 	return (new);
1374 }
1375 
1376 /*
1377  * Function:	hook_event_init_kstats
1378  * Returns:	None
1379  * Parameters:  hfi(I) - pointer to the family that owns this event.
1380  *              hei(I) - pointer to the hook event that needs some kstats.
1381  *
1382  * Create a set of kstats that relate to each event registered with
1383  * the hook framework.  A counter is kept for each time the event is
1384  * activated and for each time a hook is added or removed.  As the
1385  * kstats just count the events as they happen, the total number of
1386  * hooks registered must be obtained by subtractived removed from added.
1387  */
1388 static void
1389 hook_event_init_kstats(hook_family_int_t *hfi, hook_event_int_t *hei)
1390 {
1391 	hook_event_kstat_t template = {
1392 		{ "hooksAdded",		KSTAT_DATA_UINT64 },
1393 		{ "hooksRemoved",	KSTAT_DATA_UINT64 },
1394 		{ "events",		KSTAT_DATA_UINT64 }
1395 	};
1396 	hook_stack_t *hks;
1397 
1398 	hks = hfi->hfi_stack;
1399 	hei->hei_kstatp = kstat_create_netstack(hfi->hfi_family.hf_name, 0,
1400 	    hei->hei_event->he_name, "hook_event", KSTAT_TYPE_NAMED,
1401 	    sizeof (hei->hei_kstats) / sizeof (kstat_named_t),
1402 	    KSTAT_FLAG_VIRTUAL, hks->hks_netstackid);
1403 
1404 	bcopy((char *)&template, &hei->hei_kstats, sizeof (template));
1405 
1406 	if (hei->hei_kstatp != NULL) {
1407 		hei->hei_kstatp->ks_data = (void *)&hei->hei_kstats;
1408 		hei->hei_kstatp->ks_private =
1409 		    (void *)(uintptr_t)hks->hks_netstackid;
1410 
1411 		kstat_install(hei->hei_kstatp);
1412 	}
1413 }
1414 
1415 /*
1416  * Function:	hook_event_remove
1417  * Returns:	int    - 0 = success, else = failure
1418  * Parameters:	hfi(I) - internal family pointer
1419  *		he(I)  - event pointer
1420  *
1421  * Remove event from event list on specific family
1422  *
1423  * This function assumes that the caller has received a pointer to a the
1424  * hook_family_int_t via a call to net_protocol_lookup or net_protocol_unreg'.
1425  * This the hook_family_int_t is guaranteed to be around for the life of this
1426  * call, unless the caller has decided to call net_protocol_release or
1427  * net_protocol_unregister before calling net_event_unregister - an error.
1428  */
1429 int
1430 hook_event_remove(hook_family_int_t *hfi, hook_event_t *he)
1431 {
1432 	boolean_t free_family;
1433 	hook_event_int_t *hei;
1434 	boolean_t notifydone;
1435 
1436 	ASSERT(hfi != NULL);
1437 	ASSERT(he != NULL);
1438 
1439 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1440 
1441 	/*
1442 	 * Set the flag so that we can call hook_event_notify_run without
1443 	 * holding any locks but at the same time prevent other changes to
1444 	 * the event at the same time.
1445 	 */
1446 	if (hook_wait_setflag(&hfi->hfi_waiter, FWF_DEL_WAIT_MASK,
1447 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
1448 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1449 		return (ENXIO);
1450 	}
1451 
1452 	hei = hook_event_find(hfi, he->he_name);
1453 	if (hei == NULL) {
1454 		hook_wait_unsetflag(&hfi->hfi_waiter, FWF_DEL_ACTIVE);
1455 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1456 		return (ESRCH);
1457 	}
1458 
1459 	free_family = B_FALSE;
1460 
1461 	CVW_ENTER_WRITE(&hei->hei_lock);
1462 	/*
1463 	 * The hei_shutdown flag is used to indicate whether or not we have
1464 	 * done a shutdown and thus already walked through the notify list.
1465 	 */
1466 	notifydone = hei->hei_shutdown;
1467 	hei->hei_shutdown = B_TRUE;
1468 	/*
1469 	 * If there are any hooks still registered for this event or
1470 	 * there are any notifiers registered, return an error indicating
1471 	 * that the event is still busy.
1472 	 */
1473 	if (!TAILQ_EMPTY(&hei->hei_head) || !TAILQ_EMPTY(&hei->hei_nhead)) {
1474 		hei->hei_condemned = B_TRUE;
1475 		CVW_EXIT_WRITE(&hei->hei_lock);
1476 	} else {
1477 		/* hei_condemned = B_FALSE is implied from creation */
1478 		/*
1479 		 * Even though we know the notify list is empty, we call
1480 		 * hook_wait_destroy here to synchronise wait removing a
1481 		 * hook from an event.
1482 		 */
1483 		VERIFY(hook_wait_destroy(&hei->hei_waiter) == 0);
1484 
1485 		CVW_EXIT_WRITE(&hei->hei_lock);
1486 
1487 		if (hfi->hfi_condemned && SLIST_EMPTY(&hfi->hfi_head) &&
1488 		    TAILQ_EMPTY(&hfi->hfi_nhead))
1489 			free_family = B_TRUE;
1490 	}
1491 
1492 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1493 
1494 	if (!notifydone)
1495 		hook_notify_run(&hfi->hfi_nhead,
1496 		    hfi->hfi_family.hf_name, NULL, he->he_name, HN_UNREGISTER);
1497 
1498 	hook_wait_unsetflag(&hfi->hfi_waiter, FWF_DEL_ACTIVE);
1499 
1500 	if (!hei->hei_condemned) {
1501 		hook_event_free(hei, hfi);
1502 		if (free_family)
1503 			hook_family_free(hfi, hfi->hfi_stack);
1504 	}
1505 
1506 	return (0);
1507 }
1508 
1509 /*
1510  * Function:	hook_event_shutdown
1511  * Returns:	int    - 0 = success, else = failure
1512  * Parameters:	hfi(I) - internal family pointer
1513  *		he(I)  - event pointer
1514  *
1515  * As with hook_family_shutdown, we want to generate the notify callbacks
1516  * as if the event was being removed but not actually do the remove.
1517  */
1518 int
1519 hook_event_shutdown(hook_family_int_t *hfi, hook_event_t *he)
1520 {
1521 	hook_event_int_t *hei;
1522 	boolean_t notifydone;
1523 
1524 	ASSERT(hfi != NULL);
1525 	ASSERT(he != NULL);
1526 
1527 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1528 
1529 	/*
1530 	 * Set the flag so that we can call hook_event_notify_run without
1531 	 * holding any locks but at the same time prevent other changes to
1532 	 * the event at the same time.
1533 	 */
1534 	if (hook_wait_setflag(&hfi->hfi_waiter, FWF_DEL_WAIT_MASK,
1535 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
1536 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1537 		return (ENXIO);
1538 	}
1539 
1540 	hei = hook_event_find(hfi, he->he_name);
1541 	if (hei == NULL) {
1542 		hook_wait_unsetflag(&hfi->hfi_waiter, FWF_DEL_ACTIVE);
1543 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1544 		return (ESRCH);
1545 	}
1546 
1547 	CVW_ENTER_WRITE(&hei->hei_lock);
1548 	notifydone = hei->hei_shutdown;
1549 	hei->hei_shutdown = B_TRUE;
1550 	CVW_EXIT_WRITE(&hei->hei_lock);
1551 
1552 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1553 
1554 	if (!notifydone)
1555 		hook_notify_run(&hfi->hfi_nhead,
1556 		    hfi->hfi_family.hf_name, NULL, he->he_name, HN_UNREGISTER);
1557 
1558 	hook_wait_unsetflag(&hfi->hfi_waiter, FWF_DEL_ACTIVE);
1559 
1560 	return (0);
1561 }
1562 
1563 /*
1564  * Function:	hook_event_free
1565  * Returns:	None
1566  * Parameters:	hei(I) - internal event pointer
1567  *
1568  * Free alloc memory for event
1569  */
1570 static void
1571 hook_event_free(hook_event_int_t *hei, hook_family_int_t *hfi)
1572 {
1573 	boolean_t free_family;
1574 
1575 	ASSERT(hei != NULL);
1576 
1577 	if (hfi != NULL) {
1578 		CVW_ENTER_WRITE(&hfi->hfi_lock);
1579 		/*
1580 		 * Remove the event from the hook family's list.
1581 		 */
1582 		SLIST_REMOVE(&hfi->hfi_head, hei, hook_event_int, hei_entry);
1583 		if (hfi->hfi_condemned && SLIST_EMPTY(&hfi->hfi_head) &&
1584 		    TAILQ_EMPTY(&hfi->hfi_nhead)) {
1585 			free_family = B_TRUE;
1586 		} else {
1587 			free_family = B_FALSE;
1588 		}
1589 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1590 	}
1591 
1592 	if (hei->hei_kstatp != NULL) {
1593 		ASSERT(hfi != NULL);
1594 
1595 		kstat_delete_netstack(hei->hei_kstatp,
1596 		    hfi->hfi_stack->hks_netstackid);
1597 		hei->hei_kstatp = NULL;
1598 	}
1599 
1600 	/* Free container */
1601 	kmem_free(hei, sizeof (*hei));
1602 
1603 	if (free_family)
1604 		hook_family_free(hfi, hfi->hfi_stack);
1605 }
1606 
1607 /*
1608  * Function:    hook_event_checkdup
1609  * Returns:     internal event pointer - NULL = Not match
1610  * Parameters:  he(I) - event pointer
1611  *
1612  * Search all of the hook families to see if the event being passed in
1613  * has already been associated with one.
1614  */
1615 static hook_event_int_t *
1616 hook_event_checkdup(hook_event_t *he, hook_stack_t *hks)
1617 {
1618 	hook_family_int_t *hfi;
1619 	hook_event_int_t *hei;
1620 
1621 	ASSERT(he != NULL);
1622 
1623 	CVW_ENTER_READ(&hks->hks_lock);
1624 	SLIST_FOREACH(hfi, &hks->hks_familylist, hfi_entry) {
1625 		SLIST_FOREACH(hei, &hfi->hfi_head, hei_entry) {
1626 			if (hei->hei_event == he) {
1627 				CVW_EXIT_READ(&hks->hks_lock);
1628 				return (hei);
1629 			}
1630 		}
1631 	}
1632 	CVW_EXIT_READ(&hks->hks_lock);
1633 
1634 	return (NULL);
1635 }
1636 
1637 /*
1638  * Function:	hook_event_copy
1639  * Returns:	internal event pointer - NULL = Failed
1640  * Parameters:	src(I) - event pointer
1641  *
1642  * Allocate internal event block and duplicate incoming event
1643  * No locks should be held across this function as it may sleep.
1644  */
1645 static hook_event_int_t *
1646 hook_event_copy(hook_event_t *src)
1647 {
1648 	hook_event_int_t *new;
1649 
1650 	ASSERT(src != NULL);
1651 	ASSERT(src->he_name != NULL);
1652 
1653 	new = (hook_event_int_t *)kmem_zalloc(sizeof (*new), KM_SLEEP);
1654 
1655 	/* Copy body */
1656 	TAILQ_INIT(&new->hei_head);
1657 	new->hei_event = src;
1658 
1659 	return (new);
1660 }
1661 
1662 /*
1663  * Function:	hook_event_find
1664  * Returns:	internal event pointer - NULL = Not match
1665  * Parameters:	hfi(I)   - internal family pointer
1666  *		event(I) - event name string
1667  *
1668  * Search event list with event name
1669  *	A lock on hfi->hfi_lock must be held when called.
1670  */
1671 static hook_event_int_t *
1672 hook_event_find(hook_family_int_t *hfi, char *event)
1673 {
1674 	hook_event_int_t *hei = NULL;
1675 
1676 	ASSERT(hfi != NULL);
1677 	ASSERT(event != NULL);
1678 
1679 	SLIST_FOREACH(hei, &hfi->hfi_head, hei_entry) {
1680 		if ((strcmp(hei->hei_event->he_name, event) == 0) &&
1681 		    ((hei->hei_waiter.fw_flags & FWF_UNSAFE) == 0))
1682 			break;
1683 	}
1684 	return (hei);
1685 }
1686 
1687 /*
1688  * Function:	hook_event_notify_register
1689  * Returns:	int         - 0 = success, else failure
1690  * Parameters:	hfi(I)      - hook family
1691  *              event(I)    - name of the event
1692  *              callback(I) - function to be called
1693  *              arg(I)      - arg to provide callback when it is called
1694  *
1695  * Adds a new callback to the event named by "event" (we must find it)
1696  * that will be executed each time a new hook is added to the event.
1697  * Of course, if the stack is being shut down, this call should fail.
1698  */
1699 int
1700 hook_event_notify_register(hook_family_int_t *hfi, char *event,
1701     hook_notify_fn_t callback, void *arg)
1702 {
1703 	hook_event_int_t *hei;
1704 	hook_stack_t *hks;
1705 	boolean_t canrun;
1706 	hook_int_t *h;
1707 	int error;
1708 
1709 	canrun = B_FALSE;
1710 	hks = hfi->hfi_stack;
1711 	CVW_ENTER_READ(&hks->hks_lock);
1712 	if (hks->hks_shutdown != 0) {
1713 		CVW_EXIT_READ(&hks->hks_lock);
1714 		return (ESHUTDOWN);
1715 	}
1716 
1717 	CVW_ENTER_READ(&hfi->hfi_lock);
1718 
1719 	if (hfi->hfi_condemned || hfi->hfi_shutdown) {
1720 		CVW_EXIT_READ(&hfi->hfi_lock);
1721 		CVW_EXIT_READ(&hks->hks_lock);
1722 		return (ESHUTDOWN);
1723 	}
1724 
1725 	hei = hook_event_find(hfi, event);
1726 	if (hei == NULL) {
1727 		CVW_EXIT_READ(&hfi->hfi_lock);
1728 		CVW_EXIT_READ(&hks->hks_lock);
1729 		return (ESRCH);
1730 	}
1731 
1732 	if (hei->hei_condemned || hei->hei_shutdown) {
1733 		CVW_EXIT_READ(&hfi->hfi_lock);
1734 		CVW_EXIT_READ(&hks->hks_lock);
1735 		return (ESHUTDOWN);
1736 	}
1737 
1738 	CVW_ENTER_WRITE(&hei->hei_lock);
1739 	canrun = (hook_wait_setflag(&hei->hei_waiter, FWF_ADD_WAIT_MASK,
1740 	    FWF_ADD_WANTED, FWF_ADD_ACTIVE) != -1);
1741 	error = hook_notify_register(&hei->hei_nhead, callback, arg);
1742 	CVW_EXIT_WRITE(&hei->hei_lock);
1743 
1744 	CVW_EXIT_READ(&hfi->hfi_lock);
1745 	CVW_EXIT_READ(&hks->hks_lock);
1746 
1747 	if (error == 0 && canrun) {
1748 		TAILQ_FOREACH(h, &hei->hei_head, hi_entry) {
1749 			callback(HN_REGISTER, arg,
1750 			    hfi->hfi_family.hf_name, hei->hei_event->he_name,
1751 			    h->hi_hook.h_name);
1752 		}
1753 	}
1754 
1755 	if (canrun)
1756 		hook_wait_unsetflag(&hei->hei_waiter, FWF_ADD_ACTIVE);
1757 
1758 	return (error);
1759 }
1760 
1761 /*
1762  * Function:	hook_event_notify_unregister
1763  * Returns:	int         - 0 = success, else failure
1764  * Parameters:	hfi(I)      - hook family
1765  *              event(I)    - name of the event
1766  *              callback(I) - function to be called
1767  *
1768  * Remove the given callback from the named event's list of functions
1769  * to call when a hook is added or removed.
1770  */
1771 int
1772 hook_event_notify_unregister(hook_family_int_t *hfi, char *event,
1773     hook_notify_fn_t callback)
1774 {
1775 	hook_event_int_t *hei;
1776 	boolean_t free_event;
1777 	boolean_t canrun;
1778 	hook_int_t *h;
1779 	void *arg;
1780 	int error;
1781 
1782 	canrun = B_FALSE;
1783 
1784 	CVW_ENTER_READ(&hfi->hfi_lock);
1785 
1786 	hei = hook_event_find(hfi, event);
1787 	if (hei == NULL) {
1788 		CVW_EXIT_READ(&hfi->hfi_lock);
1789 		return (ESRCH);
1790 	}
1791 
1792 	CVW_ENTER_WRITE(&hei->hei_lock);
1793 
1794 	(void) hook_wait_setflag(&hei->hei_waiter, FWF_DEL_WAIT_MASK,
1795 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE);
1796 
1797 	error = hook_notify_unregister(&hei->hei_nhead, callback, &arg);
1798 
1799 	hook_wait_unsetflag(&hei->hei_waiter, FWF_DEL_ACTIVE);
1800 
1801 	/*
1802 	 * hei_condemned has been set if someone tried to remove the
1803 	 * event but couldn't because there were still things attached to
1804 	 * it. Now that we've done a successful remove, if it is now empty
1805 	 * then by all rights we should be free'ing it too.  Note that the
1806 	 * expectation is that only the caller of hook_event_add will ever
1807 	 * call hook_event_remove.
1808 	 */
1809 	if ((error == 0) && hei->hei_condemned &&
1810 	    TAILQ_EMPTY(&hei->hei_head) && TAILQ_EMPTY(&hei->hei_nhead)) {
1811 		free_event = B_TRUE;
1812 	} else {
1813 		free_event = B_FALSE;
1814 	}
1815 
1816 	if (error == 0 && !free_event) {
1817 		canrun = (hook_wait_setflag(&hei->hei_waiter, FWF_ADD_WAIT_MASK,
1818 		    FWF_ADD_WANTED, FWF_ADD_ACTIVE) != -1);
1819 	}
1820 
1821 	CVW_EXIT_WRITE(&hei->hei_lock);
1822 	CVW_EXIT_READ(&hfi->hfi_lock);
1823 
1824 	if (canrun) {
1825 		TAILQ_FOREACH(h, &hei->hei_head, hi_entry) {
1826 			callback(HN_UNREGISTER, arg,
1827 			    hfi->hfi_family.hf_name, hei->hei_event->he_name,
1828 			    h->hi_hook.h_name);
1829 		}
1830 
1831 		hook_wait_unsetflag(&hei->hei_waiter, FWF_ADD_ACTIVE);
1832 	}
1833 
1834 	if (free_event) {
1835 		/*
1836 		 * It is safe to pass in hfi here, without a lock, because
1837 		 * our structure (hei) is still on one of its lists and thus
1838 		 * it won't be able to disappear yet...
1839 		 */
1840 		hook_event_free(hei, hfi);
1841 	}
1842 
1843 	return (error);
1844 }
1845 
1846 /*
1847  * Function:	hook_event_notify_run
1848  * Returns:	None
1849  * Parameters:	nrun(I) - pointer to the list of callbacks to execute
1850  *              hfi(I)  - hook stack pointer to execute callbacks for
1851  *              name(I) - name of a hook family
1852  *              cmd(I)  - either HN_UNREGISTER or HN_REGISTER
1853  *
1854  * Execute all of the callbacks registered for this event.
1855  */
1856 static void
1857 hook_event_notify_run(hook_event_int_t *hei, hook_family_int_t *hfi,
1858     char *event, char *name, hook_notify_cmd_t cmd)
1859 {
1860 
1861 	hook_notify_run(&hei->hei_nhead, hfi->hfi_family.hf_name,
1862 	    event, name, cmd);
1863 }
1864 
1865 /*
1866  * Function:	hook_register
1867  * Returns:	int      - 0 = success, else = failure
1868  * Parameters:	hfi(I)   - internal family pointer
1869  *		event(I) - event name string
1870  *		h(I)     - hook pointer
1871  *
1872  * Add new hook to hook list on the specified family and event.
1873  */
1874 int
1875 hook_register(hook_family_int_t *hfi, char *event, hook_t *h)
1876 {
1877 	hook_event_int_t *hei;
1878 	hook_int_t *hi, *new;
1879 	int error;
1880 
1881 	ASSERT(hfi != NULL);
1882 	ASSERT(event != NULL);
1883 	ASSERT(h != NULL);
1884 
1885 	if (hfi->hfi_stack->hks_shutdown)
1886 		return (0);
1887 
1888 	/* Alloc hook_int_t and copy hook */
1889 	new = hook_copy(h);
1890 	if (new == NULL)
1891 		return (ENOMEM);
1892 
1893 	/*
1894 	 * Since hook add/remove only impact event, so it is unnecessary
1895 	 * to hold global family write lock. Just get read lock here to
1896 	 * ensure event will not be removed when doing hooks operation
1897 	 */
1898 	CVW_ENTER_WRITE(&hfi->hfi_lock);
1899 
1900 	hei = hook_event_find(hfi, event);
1901 	if (hei == NULL) {
1902 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1903 		hook_int_free(new, hfi->hfi_stack->hks_netstackid);
1904 		return (ENXIO);
1905 	}
1906 
1907 	CVW_ENTER_WRITE(&hei->hei_lock);
1908 
1909 	/*
1910 	 * If we've run either the remove() or shutdown(), do not allow any
1911 	 * more hooks to be added to this event.
1912 	 */
1913 	if (hei->hei_shutdown) {
1914 		error = ESHUTDOWN;
1915 		goto bad_add;
1916 	}
1917 
1918 	hi = hook_find(hei, h);
1919 	if (hi != NULL) {
1920 		error = EEXIST;
1921 		goto bad_add;
1922 	}
1923 
1924 	if (hook_wait_setflag(&hei->hei_waiter, FWF_ADD_WAIT_MASK,
1925 	    FWF_ADD_WANTED, FWF_ADD_ACTIVE) == -1) {
1926 		error = ENOENT;
1927 bad_add:
1928 		CVW_EXIT_WRITE(&hei->hei_lock);
1929 		CVW_EXIT_WRITE(&hfi->hfi_lock);
1930 		hook_int_free(new, hfi->hfi_stack->hks_netstackid);
1931 		return (error);
1932 	}
1933 
1934 	/* Add to hook list head */
1935 	error = hook_insert(&hei->hei_head, new);
1936 	if (error == 0) {
1937 		hei->hei_event->he_interested = B_TRUE;
1938 		hei->hei_kstats.hooks_added.value.ui64++;
1939 
1940 		hook_init_kstats(hfi, hei, new);
1941 	}
1942 
1943 	CVW_EXIT_WRITE(&hei->hei_lock);
1944 	CVW_EXIT_WRITE(&hfi->hfi_lock);
1945 
1946 	/*
1947 	 * Note that the name string passed through to the notify callbacks
1948 	 * is from the original hook being registered, not the copy being
1949 	 * inserted.
1950 	 */
1951 	if (error == 0)
1952 		hook_event_notify_run(hei, hfi, event, h->h_name, HN_REGISTER);
1953 
1954 	hook_wait_unsetflag(&hei->hei_waiter, FWF_ADD_ACTIVE);
1955 
1956 	return (error);
1957 }
1958 
1959 /*
1960  * Function:	hook_insert
1961  * Returns:	int     - 0 = success, else = failure
1962  * Parameters:	head(I) - pointer to hook list to insert hook onto
1963  *		new(I)  - pointer to hook to be inserted
1964  *
1965  * Try to insert the hook onto the list of hooks according to the hints
1966  * given in the hook to be inserted and those that already exist on the
1967  * list.  For now, the implementation permits only a single hook to be
1968  * either first or last and names provided with before or after are only
1969  * loosely coupled with the action.
1970  */
1971 static int
1972 hook_insert(hook_int_head_t *head, hook_int_t *new)
1973 {
1974 	hook_int_t *before;
1975 	hook_int_t *hi;
1976 	hook_t *hih;
1977 	hook_t *h = &new->hi_hook;
1978 
1979 	switch (new->hi_hook.h_hint) {
1980 	case HH_NONE :
1981 		before = NULL;
1982 		/*
1983 		 * If there is no hint present (or not one that can be
1984 		 * satisfied now) then try to at least respect the wishes
1985 		 * of those that want to be last.  If there are none wanting
1986 		 * to be last then add the new hook to the tail of the
1987 		 * list - this means we keep any wanting to be first
1988 		 * happy without having to search for HH_FIRST.
1989 		 */
1990 		TAILQ_FOREACH(hi, head, hi_entry) {
1991 			hih = &hi->hi_hook;
1992 			if ((hih->h_hint == HH_AFTER) &&
1993 			    (strcmp(h->h_name,
1994 			    (char *)hih->h_hintvalue) == 0)) {
1995 				TAILQ_INSERT_BEFORE(hi, new, hi_entry);
1996 				return (0);
1997 			}
1998 			if ((hih->h_hint == HH_BEFORE) && (before == NULL) &&
1999 			    (strcmp(h->h_name,
2000 			    (char *)hih->h_hintvalue) == 0)) {
2001 				before = hi;
2002 			}
2003 		}
2004 		if (before != NULL) {
2005 			TAILQ_INSERT_AFTER(head, before, new, hi_entry);
2006 			return (0);
2007 		}
2008 		hook_insert_plain(head, new);
2009 		break;
2010 
2011 	case HH_FIRST :
2012 		hi = TAILQ_FIRST(head);
2013 		if ((hi != NULL) && (hi->hi_hook.h_hint == HH_FIRST))
2014 			return (EBUSY);
2015 		TAILQ_INSERT_HEAD(head, new, hi_entry);
2016 		break;
2017 
2018 	case HH_LAST :
2019 		hi = TAILQ_LAST(head, hook_int_head);
2020 		if ((hi != NULL) && (hi->hi_hook.h_hint == HH_LAST))
2021 			return (EBUSY);
2022 		TAILQ_INSERT_TAIL(head, new, hi_entry);
2023 		break;
2024 
2025 	case HH_BEFORE :
2026 		hi = hook_find_byname(head, (char *)new->hi_hook.h_hintvalue);
2027 		if (hi == NULL)
2028 			return (hook_insert_afterbefore(head, new));
2029 
2030 		if (hi->hi_hook.h_hint == HH_FIRST)
2031 			return (EBUSY);
2032 
2033 		TAILQ_INSERT_BEFORE(hi, new, hi_entry);
2034 		break;
2035 
2036 	case HH_AFTER :
2037 		hi = hook_find_byname(head, (char *)new->hi_hook.h_hintvalue);
2038 		if (hi == NULL)
2039 			return (hook_insert_afterbefore(head, new));
2040 
2041 		if (hi->hi_hook.h_hint == HH_LAST)
2042 			return (EBUSY);
2043 
2044 		TAILQ_INSERT_AFTER(head, hi, new, hi_entry);
2045 		break;
2046 
2047 	default :
2048 		return (EINVAL);
2049 	}
2050 
2051 	return (0);
2052 }
2053 
2054 /*
2055  * Function:	hook_insert_plain
2056  * Returns:	int     - 0 = success, else = failure
2057  * Parameters:	head(I) - pointer to hook list to insert hook onto
2058  *		new(I)  - pointer to hook to be inserted
2059  *
2060  * Insert a hook such that it respects the wishes of those that want to
2061  * be last.  If there are none wanting to be last then add the new hook
2062  * to the tail of the list - this means we keep any wanting to be first
2063  * happy without having to search for HH_FIRST.
2064  */
2065 static void
2066 hook_insert_plain(hook_int_head_t *head, hook_int_t *new)
2067 {
2068 	hook_int_t *hi;
2069 
2070 	hi = TAILQ_FIRST(head);
2071 	if (hi != NULL) {
2072 		if (hi->hi_hook.h_hint == HH_LAST) {
2073 			TAILQ_INSERT_BEFORE(hi, new, hi_entry);
2074 		} else {
2075 			TAILQ_INSERT_TAIL(head, new, hi_entry);
2076 		}
2077 	} else {
2078 		TAILQ_INSERT_TAIL(head, new, hi_entry);
2079 	}
2080 }
2081 
2082 /*
2083  * Function:	hook_insert_afterbefore
2084  * Returns:	int     - 0 = success, else = failure
2085  * Parameters:	head(I) - pointer to hook list to insert hook onto
2086  *		new(I)  - pointer to hook to be inserted
2087  *
2088  * Simple insertion of a hook specifying a HH_BEFORE or HH_AFTER was not
2089  * possible, so now we need to be more careful.  The first pass is to go
2090  * through the list and look for any other hooks that also specify the
2091  * same hint name as the new one.  The object of this exercise is to make
2092  * sure that hooks with HH_BEFORE always appear on the list before those
2093  * with HH_AFTER so that when said hook arrives, it can be placed in the
2094  * middle of the BEFOREs and AFTERs.  If this condition does not arise,
2095  * just use hook_insert_plain() to try and insert the hook somewhere that
2096  * is innocuous to existing efforts.
2097  */
2098 static int
2099 hook_insert_afterbefore(hook_int_head_t *head, hook_int_t *new)
2100 {
2101 	hook_int_t *hi;
2102 	hook_t *nh;
2103 	hook_t *h;
2104 
2105 	nh = &new->hi_hook;
2106 	ASSERT(new->hi_hook.h_hint != HH_NONE);
2107 	ASSERT(new->hi_hook.h_hint != HH_LAST);
2108 	ASSERT(new->hi_hook.h_hint != HH_FIRST);
2109 
2110 	/*
2111 	 * First, look through the list to see if there are any other
2112 	 * before's or after's that have a matching hint name.
2113 	 */
2114 	TAILQ_FOREACH(hi, head, hi_entry) {
2115 		h = &hi->hi_hook;
2116 		switch (h->h_hint) {
2117 		case HH_FIRST :
2118 		case HH_LAST :
2119 		case HH_NONE :
2120 			break;
2121 		case HH_BEFORE :
2122 			if ((nh->h_hint == HH_BEFORE) &&
2123 			    (strcmp((char *)h->h_hintvalue,
2124 			    (char *)nh->h_hintvalue) == 0)) {
2125 				TAILQ_INSERT_AFTER(head, hi, new, hi_entry);
2126 				return (0);
2127 			}
2128 			if ((nh->h_hint == HH_AFTER) &&
2129 			    (strcmp((char *)h->h_hintvalue,
2130 			    (char *)nh->h_hintvalue) == 0)) {
2131 				TAILQ_INSERT_BEFORE(hi, new, hi_entry);
2132 				return (0);
2133 			}
2134 			break;
2135 		case HH_AFTER :
2136 			if ((nh->h_hint == HH_AFTER) &&
2137 			    (strcmp((char *)h->h_hintvalue,
2138 			    (char *)nh->h_hintvalue) == 0)) {
2139 				TAILQ_INSERT_AFTER(head, hi, new, hi_entry);
2140 				return (0);
2141 			}
2142 			if ((nh->h_hint == HH_BEFORE) &&
2143 			    (strcmp((char *)h->h_hintvalue,
2144 			    (char *)nh->h_hintvalue) == 0)) {
2145 				TAILQ_INSERT_BEFORE(hi, new, hi_entry);
2146 				return (0);
2147 			}
2148 			break;
2149 		}
2150 	}
2151 
2152 	hook_insert_plain(head, new);
2153 
2154 	return (0);
2155 }
2156 
2157 /*
2158  * Function:	hook_unregister
2159  * Returns:	int      - 0 = success, else = failure
2160  * Parameters:	hfi(I)   - internal family pointer
2161  *		event(I) - event name string
2162  *		h(I)     - hook pointer
2163  *
2164  * Remove hook from hook list on specific family, event
2165  */
2166 int
2167 hook_unregister(hook_family_int_t *hfi, char *event, hook_t *h)
2168 {
2169 	hook_event_int_t *hei;
2170 	hook_int_t *hi;
2171 	boolean_t free_event;
2172 
2173 	ASSERT(hfi != NULL);
2174 	ASSERT(h != NULL);
2175 
2176 	CVW_ENTER_WRITE(&hfi->hfi_lock);
2177 
2178 	hei = hook_event_find(hfi, event);
2179 	if (hei == NULL) {
2180 		CVW_EXIT_WRITE(&hfi->hfi_lock);
2181 		return (ENXIO);
2182 	}
2183 
2184 	/* Hold write lock for event */
2185 	CVW_ENTER_WRITE(&hei->hei_lock);
2186 
2187 	hi = hook_find(hei, h);
2188 	if (hi == NULL) {
2189 		CVW_EXIT_WRITE(&hei->hei_lock);
2190 		CVW_EXIT_WRITE(&hfi->hfi_lock);
2191 		return (ENXIO);
2192 	}
2193 
2194 	if (hook_wait_setflag(&hei->hei_waiter, FWF_DEL_WAIT_MASK,
2195 	    FWF_DEL_WANTED, FWF_DEL_ACTIVE) == -1) {
2196 		CVW_EXIT_WRITE(&hei->hei_lock);
2197 		CVW_EXIT_WRITE(&hfi->hfi_lock);
2198 		return (ENOENT);
2199 	}
2200 
2201 	/* Remove from hook list */
2202 	TAILQ_REMOVE(&hei->hei_head, hi, hi_entry);
2203 
2204 	free_event = B_FALSE;
2205 	if (TAILQ_EMPTY(&hei->hei_head)) {
2206 		hei->hei_event->he_interested = B_FALSE;
2207 		/*
2208 		 * If the delete pending flag has been set and there are
2209 		 * no notifiers on the event (and we've removed the last
2210 		 * hook) then we need to free this event after we're done.
2211 		 */
2212 		if (hei->hei_condemned && TAILQ_EMPTY(&hei->hei_nhead))
2213 			free_event = B_TRUE;
2214 	}
2215 	hei->hei_kstats.hooks_removed.value.ui64++;
2216 
2217 	CVW_EXIT_WRITE(&hei->hei_lock);
2218 	CVW_EXIT_WRITE(&hfi->hfi_lock);
2219 	/*
2220 	 * While the FWF_DEL_ACTIVE flag is set, the hook_event_int_t
2221 	 * will not be free'd and thus the hook_family_int_t wil not
2222 	 * be free'd either.
2223 	 */
2224 	hook_event_notify_run(hei, hfi, event, h->h_name, HN_UNREGISTER);
2225 	hook_wait_unsetflag(&hei->hei_waiter, FWF_DEL_ACTIVE);
2226 
2227 	hook_int_free(hi, hfi->hfi_stack->hks_netstackid);
2228 
2229 	if (free_event)
2230 		hook_event_free(hei, hfi);
2231 
2232 	return (0);
2233 }
2234 
2235 /*
2236  * Function:	hook_find_byname
2237  * Returns:	internal hook pointer - NULL = Not match
2238  * Parameters:	hei(I) - internal event pointer
2239  *		name(I)- hook name
2240  *
2241  * Search an event's list of hooks to see if there is a hook present that
2242  * has a matching name to the one being looked for.
2243  */
2244 static hook_int_t *
2245 hook_find_byname(hook_int_head_t *head, char *name)
2246 {
2247 	hook_int_t *hi;
2248 
2249 	TAILQ_FOREACH(hi, head, hi_entry) {
2250 		if (strcmp(hi->hi_hook.h_name, name) == 0)
2251 			return (hi);
2252 	}
2253 
2254 	return (NULL);
2255 }
2256 
2257 /*
2258  * Function:	hook_find
2259  * Returns:	internal hook pointer - NULL = Not match
2260  * Parameters:	hei(I) - internal event pointer
2261  *		h(I)   - hook pointer
2262  *
2263  * Search an event's list of hooks to see if there is already one that
2264  * matches the hook being passed in.  Currently the only criteria for a
2265  * successful search here is for the names to be the same.
2266  */
2267 static hook_int_t *
2268 hook_find(hook_event_int_t *hei, hook_t *h)
2269 {
2270 
2271 	ASSERT(hei != NULL);
2272 	ASSERT(h != NULL);
2273 
2274 	return (hook_find_byname(&hei->hei_head, h->h_name));
2275 }
2276 
2277 /*
2278  * Function:	hook_copy
2279  * Returns:	internal hook pointer - NULL = Failed
2280  * Parameters:	src(I) - hook pointer
2281  *
2282  * Allocate internal hook block and duplicate incoming hook.
2283  * No locks should be held across this function as it may sleep.
2284  * Because hook_copy() is responsible for the creation of the internal
2285  * hook structure that is used here, it takes on population the structure
2286  * with the kstat information.  Note that while the kstat bits are
2287  * seeded here, their installation of the kstats is handled elsewhere.
2288  */
2289 static hook_int_t *
2290 hook_copy(hook_t *src)
2291 {
2292 	hook_int_t *new;
2293 	hook_t *dst;
2294 	int len;
2295 
2296 	ASSERT(src != NULL);
2297 	ASSERT(src->h_name != NULL);
2298 
2299 	new = (hook_int_t *)kmem_zalloc(sizeof (*new), KM_SLEEP);
2300 
2301 	/* Copy body */
2302 	dst = &new->hi_hook;
2303 	*dst = *src;
2304 
2305 	/* Copy name */
2306 	len = strlen(src->h_name);
2307 	dst->h_name = (char *)kmem_alloc(len + 1, KM_SLEEP);
2308 	(void) strcpy(dst->h_name, src->h_name);
2309 
2310 	/*
2311 	 * This is initialised in this manner to make it safer to use the
2312 	 * same pointer in the kstats field.
2313 	 */
2314 	dst->h_hintvalue = (uintptr_t)"";
2315 
2316 	if (dst->h_hint == HH_BEFORE || dst->h_hint == HH_AFTER) {
2317 		len = strlen((char *)src->h_hintvalue);
2318 		if (len > 0) {
2319 			dst->h_hintvalue = (uintptr_t)kmem_alloc(len + 1,
2320 			    KM_SLEEP);
2321 			(void) strcpy((char *)dst->h_hintvalue,
2322 			    (char *)src->h_hintvalue);
2323 		}
2324 	}
2325 
2326 	return (new);
2327 }
2328 
2329 /*
2330  * Function:	hook_init_kstats
2331  * Returns:	None
2332  * Parameters:  hfi(I) - pointer to the family that owns the event.
2333  *              hei(I) - pointer to the event that owns this hook
2334  *              hi(I)  - pointer to the hook for which we create kstats for
2335  *
2336  * Each hook that is registered with this framework has its own kstats
2337  * set up so that we can provide an easy way in which to observe the
2338  * look of hooks (using the kstat command.) The position is set to 0
2339  * here but is recalculated after we know the insertion has been a
2340  * success.
2341  */
2342 static void
2343 hook_init_kstats(hook_family_int_t *hfi, hook_event_int_t *hei, hook_int_t *hi)
2344 {
2345 	hook_hook_kstat_t template = {
2346 		{ "version",			KSTAT_DATA_INT32 },
2347 		{ "flags",			KSTAT_DATA_UINT32 },
2348 		{ "hint",			KSTAT_DATA_INT32 },
2349 		{ "hint_value",			KSTAT_DATA_STRING },
2350 		{ "position",			KSTAT_DATA_INT32 },
2351 		{ "hook_hits",			KSTAT_DATA_UINT64 }
2352 	};
2353 	hook_stack_t *hks;
2354 	size_t kslen;
2355 	int position;
2356 	hook_int_t *h;
2357 
2358 	kslen = strlen(hfi->hfi_family.hf_name) +
2359 	    strlen(hei->hei_event->he_name) + 2;
2360 
2361 	hi->hi_ksname = (char *)kmem_zalloc(kslen, KM_SLEEP);
2362 	(void) snprintf(hi->hi_ksname, kslen, "%s/%s",
2363 	    hfi->hfi_family.hf_name, hei->hei_event->he_name);
2364 
2365 	hks = hfi->hfi_stack;
2366 	hi->hi_kstatp = kstat_create_netstack(hi->hi_ksname, 0,
2367 	    hi->hi_hook.h_name, "hook", KSTAT_TYPE_NAMED,
2368 	    sizeof (hi->hi_kstats) / sizeof (kstat_named_t),
2369 	    KSTAT_FLAG_VIRTUAL, hks->hks_netstackid);
2370 
2371 	/* Initialise the kstats for the structure */
2372 	bcopy(&template, &hi->hi_kstats, sizeof (template));
2373 	hi->hi_kstats.hook_version.value.i32 = hi->hi_hook.h_version;
2374 	hi->hi_kstats.hook_flags.value.ui32 = hi->hi_hook.h_flags;
2375 	hi->hi_kstats.hook_hint.value.i32 = hi->hi_hook.h_hint;
2376 	hi->hi_kstats.hook_position.value.i32 = 0;
2377 	hi->hi_kstats.hook_hits.value.ui64 = 0;
2378 
2379 	switch (hi->hi_hook.h_hint) {
2380 	case HH_BEFORE :
2381 	case HH_AFTER :
2382 		kstat_named_setstr(&(hi->hi_kstats.hook_hintvalue),
2383 		    (const char *)hi->hi_hook.h_hintvalue);
2384 		break;
2385 	default :
2386 		kstat_named_setstr(&(hi->hi_kstats.hook_hintvalue),
2387 		    hook_hintvalue_none);
2388 		break;
2389 	}
2390 
2391 	if (hi->hi_kstatp != NULL) {
2392 		hi->hi_kstatp->ks_data = (void *)&hi->hi_kstats;
2393 		hi->hi_kstatp->ks_private =
2394 		    (void *)(uintptr_t)hks->hks_netstackid;
2395 		hi->hi_kstatp->ks_data_size +=
2396 		    KSTAT_NAMED_STR_BUFLEN(&(hi->hi_kstats.hook_hintvalue)) + 1;
2397 
2398 		kstat_install(hi->hi_kstatp);
2399 	}
2400 
2401 	position = 1;
2402 	TAILQ_FOREACH(h, &hei->hei_head, hi_entry) {
2403 		h->hi_kstats.hook_position.value.ui32 = position++;
2404 	}
2405 }
2406 
2407 /*
2408  * Function:	hook_int_free
2409  * Returns:	None
2410  * Parameters:	hi(I) - internal hook pointer
2411  *
2412  * Free memory allocated to support a hook.
2413  */
2414 static void
2415 hook_int_free(hook_int_t *hi, netstackid_t stackid)
2416 {
2417 	int len;
2418 
2419 	ASSERT(hi != NULL);
2420 
2421 	/* Free name space */
2422 	if (hi->hi_hook.h_name != NULL) {
2423 		kmem_free(hi->hi_hook.h_name, strlen(hi->hi_hook.h_name) + 1);
2424 	}
2425 	if (hi->hi_ksname != NULL) {
2426 		kmem_free(hi->hi_ksname, strlen(hi->hi_ksname) + 1);
2427 	}
2428 
2429 	/* Free the name used with the before/after hints. */
2430 	switch (hi->hi_hook.h_hint) {
2431 	case HH_BEFORE :
2432 	case HH_AFTER :
2433 		len = strlen((char *)hi->hi_hook.h_hintvalue);
2434 		if (len > 0)
2435 			kmem_free((void *)hi->hi_hook.h_hintvalue, len + 1);
2436 		break;
2437 	default :
2438 		break;
2439 	}
2440 
2441 	if (hi->hi_kstatp != NULL)
2442 		kstat_delete_netstack(hi->hi_kstatp, stackid);
2443 
2444 	/* Free container */
2445 	kmem_free(hi, sizeof (*hi));
2446 }
2447 
2448 /*
2449  * Function:	hook_alloc
2450  * Returns:	hook_t *   - pointer to new hook structure
2451  * Parameters:	version(I) - version number of the API when compiled
2452  *
2453  * This function serves as the interface for consumers to obtain a hook_t
2454  * structure.  At this point in time, there is only a single "version" of
2455  * it, leading to a straight forward function.  In a perfect world the
2456  * h_vesion would be a protected data structure member, but C isn't that
2457  * advanced...
2458  */
2459 hook_t *
2460 hook_alloc(const int h_version)
2461 {
2462 	hook_t *h;
2463 
2464 	h = kmem_zalloc(sizeof (hook_t), KM_SLEEP);
2465 	h->h_version = h_version;
2466 	return (h);
2467 }
2468 
2469 /*
2470  * Function:	hook_free
2471  * Returns:	None
2472  * Parameters:	h(I) - external hook pointer
2473  *
2474  * This function only free's memory allocated with hook_alloc(), so that if
2475  * (for example) kernel memory was allocated for h_name, this needs to be
2476  * free'd before calling hook_free().
2477  */
2478 void
2479 hook_free(hook_t *h)
2480 {
2481 	kmem_free(h, sizeof (*h));
2482 }
2483 
2484 /*
2485  * Function:	hook_notify_register
2486  * Returns:	int         - 0 = success, else failure
2487  * Parameters:	head(I)     - top of the list of callbacks
2488  *              callback(I) - function to be called
2489  *              arg(I)      - arg to pass back to the function
2490  *
2491  * This function implements the modification of the list of callbacks
2492  * that are registered when someone wants to be advised of a change
2493  * that has happened.
2494  */
2495 static int
2496 hook_notify_register(hook_notify_head_t *head, hook_notify_fn_t callback,
2497     void *arg)
2498 {
2499 	hook_notify_t *hn;
2500 
2501 	TAILQ_FOREACH(hn, head, hn_entry) {
2502 		if (hn->hn_func == callback) {
2503 			return (EEXIST);
2504 		}
2505 	}
2506 
2507 	hn = (hook_notify_t *)kmem_alloc(sizeof (*hn), KM_SLEEP);
2508 	hn->hn_func = callback;
2509 	hn->hn_arg = arg;
2510 	TAILQ_INSERT_TAIL(head, hn, hn_entry);
2511 
2512 	return (0);
2513 }
2514 
2515 /*
2516  * Function:	hook_notify_unregister
2517  * Returns:	int         - 0 = success, else failure
2518  * Parameters:	stackid(I)  - netstack identifier
2519  *              callback(I) - function to be called
2520  *              parg(O)     - pointer to storage for pointer
2521  *
2522  * When calling this function, the provision of a valid pointer in parg
2523  * allows the caller to be made aware of what argument the hook function
2524  * was expecting. This then allows the simulation of HN_UNREGISTER events
2525  * when a notify-unregister is performed.
2526  */
2527 static int
2528 hook_notify_unregister(hook_notify_head_t *head,
2529     hook_notify_fn_t callback, void **parg)
2530 {
2531 	hook_notify_t *hn;
2532 
2533 	ASSERT(parg != NULL);
2534 
2535 	TAILQ_FOREACH(hn, head, hn_entry) {
2536 		if (hn->hn_func == callback)
2537 			break;
2538 	}
2539 
2540 	if (hn == NULL)
2541 		return (ESRCH);
2542 
2543 	*parg = hn->hn_arg;
2544 
2545 	TAILQ_REMOVE(head, hn, hn_entry);
2546 
2547 	kmem_free(hn, sizeof (*hn));
2548 
2549 	return (0);
2550 }
2551 
2552 /*
2553  * Function:	hook_notify_run
2554  * Returns:	None
2555  * Parameters:	head(I)   - top of the list of callbacks
2556  *              family(I) - name of the hook family that owns the event
2557  *              event(I)  - name of the event being changed
2558  *              name(I)   - name of the object causing change
2559  *              cmd(I)    - either HN_UNREGISTER or HN_REGISTER
2560  *
2561  * This function walks through the list of registered callbacks and
2562  * executes each one, passing back the arg supplied when registered
2563  * and the name of the family (that owns the event), event (the thing
2564  * to which we're making a change) and finally a name that describes
2565  * what is being added or removed, as indicated by cmd.
2566  *
2567  * This function does not acquire or release any lock as it is required
2568  * that code calling it do so before hand.  The use of hook_notify_head_t
2569  * is protected by the use of flagwait_t in the structures that own this
2570  * list and with the use of the FWF_ADD/DEL_ACTIVE flags.
2571  */
2572 static void
2573 hook_notify_run(hook_notify_head_t *head, char *family, char *event,
2574     char *name, hook_notify_cmd_t cmd)
2575 {
2576 	hook_notify_t *hn;
2577 
2578 	TAILQ_FOREACH(hn, head, hn_entry) {
2579 		(*hn->hn_func)(cmd, hn->hn_arg, family, event, name);
2580 	}
2581 }
2582