xref: /titanic_52/usr/src/cmd/svc/startd/protocol.c (revision 2a8d6eba033e4713ab12b61178f0513f1f075482)
1 /*
2  * CDDL HEADER START
3  *
4  * The contents of this file are subject to the terms of the
5  * Common Development and Distribution License (the "License").
6  * You may not use this file except in compliance with the License.
7  *
8  * You can obtain a copy of the license at usr/src/OPENSOLARIS.LICENSE
9  * or http://www.opensolaris.org/os/licensing.
10  * See the License for the specific language governing permissions
11  * and limitations under the License.
12  *
13  * When distributing Covered Code, include this CDDL HEADER in each
14  * file and include the License file at usr/src/OPENSOLARIS.LICENSE.
15  * If applicable, add the following below this CDDL HEADER, with the
16  * fields enclosed by brackets "[]" replaced with your own identifying
17  * information: Portions Copyright [yyyy] [name of copyright owner]
18  *
19  * CDDL HEADER END
20  */
21 /*
22  * Copyright 2009 Sun Microsystems, Inc.  All rights reserved.
23  * Use is subject to license terms.
24  */
25 
26 /*
27  * protocol.c - protocols between graph engine and restarters
28  *
29  *   The graph engine uses restarter_protocol_send_event() to send a
30  *   restarter_event_type_t to the restarter.  For delegated restarters,
31  *   this is published on the GPEC queue for the restarter, which can
32  *   then be consumed by the librestart interfaces.  For services managed
33  *   by svc.startd, the event is stored on the local restarter_queue list,
34  *   where it can be dequeued by the restarter.
35  *
36  *   The svc.startd restarter uses graph_protocol_send_event() to send
37  *   a graph_event_type_t to the graph engine when an instance's states are
38  *   updated.
39  *
40  *   The graph engine uses restarter_protocol_init_delegate() to
41  *   register its interest in a particular delegated restarter's instance
42  *   state events.  The state_cb() registered on the event channel then
43  *   invokes graph_protocol_send_event() to communicate the update to
44  *   the graph engine.
45  */
46 
47 #include <assert.h>
48 #include <libintl.h>
49 #include <libsysevent.h>
50 #include <pthread.h>
51 #include <stdarg.h>
52 #include <stdio.h>
53 #include <strings.h>
54 #include <sys/time.h>
55 #include <errno.h>
56 #include <libuutil.h>
57 
58 #include <librestart.h>
59 #include <librestart_priv.h>
60 
61 #include "protocol.h"
62 #include "startd.h"
63 
64 /* Local event queue structures. */
65 typedef struct graph_protocol_event_queue {
66 	uu_list_t		*gpeq_event_list;
67 	pthread_mutex_t		gpeq_lock;
68 } graph_protocol_event_queue_t;
69 
70 typedef struct restarter_protocol_event_queue {
71 	uu_list_t		*rpeq_event_list;
72 	pthread_mutex_t		rpeq_lock;
73 } restarter_protocol_event_queue_t;
74 
75 static uu_list_pool_t *restarter_protocol_event_queue_pool;
76 static restarter_protocol_event_queue_t *restarter_queue;
77 
78 static uu_list_pool_t *graph_protocol_event_queue_pool;
79 static graph_protocol_event_queue_t *graph_queue;
80 
81 void
82 graph_protocol_init()
83 {
84 	graph_protocol_event_queue_pool = startd_list_pool_create(
85 	    "graph_protocol_events", sizeof (graph_protocol_event_t),
86 	    offsetof(graph_protocol_event_t, gpe_link), NULL,
87 	    UU_LIST_POOL_DEBUG);
88 
89 	graph_queue = startd_zalloc(sizeof (graph_protocol_event_queue_t));
90 
91 	(void) pthread_mutex_init(&graph_queue->gpeq_lock, &mutex_attrs);
92 	graph_queue->gpeq_event_list = startd_list_create(
93 	    graph_protocol_event_queue_pool, graph_queue, NULL);
94 }
95 
96 /*
97  * "data" will be freed by the consumer
98  */
99 static void
100 graph_event_enqueue(const char *inst, graph_event_type_t event,
101     protocol_states_t *data)
102 {
103 	graph_protocol_event_t *e;
104 
105 	e = startd_zalloc(sizeof (graph_protocol_event_t));
106 
107 	if (inst != NULL) {
108 		int size = strlen(inst) + 1;
109 		e->gpe_inst = startd_alloc(size);
110 		e->gpe_inst_sz = size;
111 		(void) strlcpy(e->gpe_inst, inst, size);
112 	}
113 	e->gpe_type = event;
114 	e->gpe_data = data;
115 
116 	(void) pthread_mutex_init(&e->gpe_lock, &mutex_attrs);
117 
118 	MUTEX_LOCK(&graph_queue->gpeq_lock);
119 	uu_list_node_init(e, &e->gpe_link, graph_protocol_event_queue_pool);
120 	if (uu_list_insert_before(graph_queue->gpeq_event_list, NULL, e) == -1)
121 		uu_die("failed to enqueue graph event (%s: %s)\n",
122 		    e->gpe_inst, uu_strerror(uu_error()));
123 
124 	MUTEX_UNLOCK(&graph_queue->gpeq_lock);
125 }
126 
127 void
128 graph_event_release(graph_protocol_event_t *e)
129 {
130 	uu_list_node_fini(e, &e->gpe_link, graph_protocol_event_queue_pool);
131 	(void) pthread_mutex_destroy(&e->gpe_lock);
132 	if (e->gpe_inst != NULL)
133 		startd_free(e->gpe_inst, e->gpe_inst_sz);
134 	startd_free(e, sizeof (graph_protocol_event_t));
135 }
136 
137 /*
138  * graph_protocol_event_t *graph_event_dequeue()
139  *   The caller must hold gu_lock, and is expected to be a single thread.
140  *   It is allowed to utilize graph_event_requeue() and abort processing
141  *   on the event. If graph_event_requeue() is not called, the caller is
142  *   expected to call graph_event_release() when finished.
143  */
144 graph_protocol_event_t *
145 graph_event_dequeue()
146 {
147 	graph_protocol_event_t *e;
148 
149 	MUTEX_LOCK(&graph_queue->gpeq_lock);
150 
151 	e = uu_list_first(graph_queue->gpeq_event_list);
152 	if (e == NULL) {
153 		MUTEX_UNLOCK(&graph_queue->gpeq_lock);
154 		return (NULL);
155 	}
156 
157 	if (uu_list_next(graph_queue->gpeq_event_list, e) != NULL)
158 		gu->gu_wakeup = 1;
159 	uu_list_remove(graph_queue->gpeq_event_list, e);
160 	MUTEX_UNLOCK(&graph_queue->gpeq_lock);
161 
162 	return (e);
163 }
164 
165 /*
166  * void graph_event_requeue()
167  *   Requeue the event back at the head of the queue.
168  */
169 void
170 graph_event_requeue(graph_protocol_event_t *e)
171 {
172 	assert(e != NULL);
173 
174 	log_framework(LOG_DEBUG, "Requeing event\n");
175 
176 	MUTEX_LOCK(&graph_queue->gpeq_lock);
177 	if (uu_list_insert_after(graph_queue->gpeq_event_list, NULL, e) == -1)
178 		uu_die("failed to requeue graph event (%s: %s)\n",
179 		    e->gpe_inst, uu_strerror(uu_error()));
180 
181 	MUTEX_UNLOCK(&graph_queue->gpeq_lock);
182 }
183 
184 void
185 graph_protocol_send_event(const char *inst, graph_event_type_t event,
186     protocol_states_t *data)
187 {
188 	graph_event_enqueue(inst, event, data);
189 	MUTEX_LOCK(&gu->gu_lock);
190 	gu->gu_wakeup = 1;
191 	(void) pthread_cond_broadcast(&gu->gu_cv);
192 	MUTEX_UNLOCK(&gu->gu_lock);
193 }
194 
195 void
196 restarter_protocol_init()
197 {
198 	restarter_protocol_event_queue_pool = startd_list_pool_create(
199 	    "restarter_protocol_events", sizeof (restarter_protocol_event_t),
200 	    offsetof(restarter_protocol_event_t, rpe_link), NULL,
201 	    UU_LIST_POOL_DEBUG);
202 
203 	restarter_queue = startd_zalloc(
204 	    sizeof (restarter_protocol_event_queue_t));
205 
206 	(void) pthread_mutex_init(&restarter_queue->rpeq_lock, &mutex_attrs);
207 	restarter_queue->rpeq_event_list = startd_list_create(
208 	    restarter_protocol_event_queue_pool, restarter_queue, NULL);
209 
210 	log_framework(LOG_DEBUG, "Initialized restarter protocol\n");
211 }
212 
213 /*
214  * void restarter_event_enqueue()
215  *   Enqueue a restarter event.
216  */
217 static void
218 restarter_event_enqueue(const char *inst, restarter_event_type_t event)
219 {
220 	restarter_protocol_event_t *e;
221 	int r;
222 
223 	/* Allocate and populate the event structure. */
224 	e = startd_zalloc(sizeof (restarter_protocol_event_t));
225 
226 	e->rpe_inst = startd_alloc(strlen(inst) + 1);
227 	(void) strlcpy(e->rpe_inst, inst, strlen(inst)+1);
228 	e->rpe_type = event;
229 
230 	MUTEX_LOCK(&restarter_queue->rpeq_lock);
231 	uu_list_node_init(e, &e->rpe_link, restarter_protocol_event_queue_pool);
232 	r = uu_list_insert_before(restarter_queue->rpeq_event_list, NULL, e);
233 	assert(r == 0);
234 
235 	MUTEX_UNLOCK(&restarter_queue->rpeq_lock);
236 
237 }
238 
239 void
240 restarter_event_release(restarter_protocol_event_t *e)
241 {
242 	uu_list_node_fini(e, &e->rpe_link, restarter_protocol_event_queue_pool);
243 	startd_free(e->rpe_inst, strlen(e->rpe_inst) + 1);
244 	startd_free(e, sizeof (restarter_protocol_event_t));
245 }
246 
247 /*
248  * restarter_protocol_event_t *restarter_event_dequeue()
249  *   Dequeue a restarter protocol event. The caller is expected to be
250  *   a single thread. It is allowed to utilize restarter_event_requeue()
251  *   and abort processing on the event. The caller is expected to call
252  *   restarter_event_release() when finished.
253  */
254 restarter_protocol_event_t *
255 restarter_event_dequeue()
256 {
257 	restarter_protocol_event_t *e = NULL;
258 
259 	MUTEX_LOCK(&restarter_queue->rpeq_lock);
260 
261 	e = uu_list_first(restarter_queue->rpeq_event_list);
262 	if (e == NULL) {
263 		MUTEX_UNLOCK(&restarter_queue->rpeq_lock);
264 		return (NULL);
265 	}
266 
267 	if (uu_list_next(restarter_queue->rpeq_event_list, e) != NULL)
268 		ru->restarter_update_wakeup = 1;
269 	uu_list_remove(restarter_queue->rpeq_event_list, e);
270 	MUTEX_UNLOCK(&restarter_queue->rpeq_lock);
271 
272 	return (e);
273 }
274 
275 static int
276 state_cb(sysevent_t *syse, void *cookie)
277 {
278 	char *fmri = (char *)cookie;
279 	char *instance_name;
280 	nvlist_t *attr_list = NULL;
281 	int state, next_state;
282 	char str_state[MAX_SCF_STATE_STRING_SZ];
283 	char str_next_state[MAX_SCF_STATE_STRING_SZ];
284 	protocol_states_t *states;
285 	int err;
286 	ssize_t sz;
287 
288 	/*
289 	 * Might fail due to a bad event or a lack of memory. Try
290 	 * the callback again to see if it goes better the next time.
291 	 */
292 	if (sysevent_get_attr_list(syse, &attr_list) != 0)
293 		return (EAGAIN);
294 
295 	if ((nvlist_lookup_int32(attr_list, RESTARTER_NAME_STATE,
296 	    &state) != 0) ||
297 	    (nvlist_lookup_int32(attr_list, RESTARTER_NAME_NEXT_STATE,
298 	    &next_state) != 0) ||
299 	    (nvlist_lookup_int32(attr_list, RESTARTER_NAME_ERROR, &err) != 0) ||
300 	    (nvlist_lookup_string(attr_list, RESTARTER_NAME_INSTANCE,
301 	    &instance_name) != 0))
302 		uu_die("%s: can't decode nvlist\n", fmri);
303 
304 	states = startd_alloc(sizeof (protocol_states_t));
305 	states->ps_state = state;
306 	states->ps_state_next = next_state;
307 	states->ps_err = err;
308 
309 	graph_protocol_send_event(instance_name, GRAPH_UPDATE_STATE_CHANGE,
310 	    states);
311 
312 	sz = restarter_state_to_string(state, str_state, sizeof (str_state));
313 	assert(sz < sizeof (str_state));
314 	sz = restarter_state_to_string(next_state, str_next_state,
315 	    sizeof (str_next_state));
316 	assert(sz < sizeof (str_next_state));
317 	log_framework(LOG_DEBUG, "%s: state updates for %s (%s, %s)\n", fmri,
318 	    instance_name, str_state, str_next_state);
319 	nvlist_free(attr_list);
320 	return (0);
321 }
322 
323 evchan_t *
324 restarter_protocol_init_delegate(char *fmri)
325 {
326 	char *delegate_channel_name, *master_channel_name, *sid;
327 	evchan_t *delegate_channel, *master_channel;
328 	int r = 0;
329 
330 	/* master restarter -- nothing to do */
331 	if (strcmp(fmri, SCF_SERVICE_STARTD) == 0) {
332 		uu_warn("Attempt to initialize restarter protocol delegate "
333 		    "with %s\n", fmri);
334 		return (NULL);
335 	}
336 
337 	log_framework(LOG_DEBUG, "%s: Intializing protocol for delegate\n",
338 	    fmri);
339 
340 	delegate_channel_name = master_channel_name = NULL;
341 	if ((delegate_channel_name = _restarter_get_channel_name(fmri,
342 	    RESTARTER_CHANNEL_DELEGATE)) == NULL ||
343 	    (master_channel_name = _restarter_get_channel_name(fmri,
344 	    RESTARTER_CHANNEL_MASTER)) == NULL ||
345 	    (sid = strdup("svc.startd")) == NULL) {
346 		if (delegate_channel_name) {
347 			free(delegate_channel_name);
348 		}
349 		if (master_channel_name) {
350 			free(master_channel_name);
351 		}
352 		uu_warn("Allocation of channel name failed");
353 
354 		return (NULL);
355 	}
356 
357 	if ((r = sysevent_evc_bind(delegate_channel_name, &delegate_channel,
358 	    EVCH_CREAT|EVCH_HOLD_PEND)) != 0) {
359 		uu_warn("%s: sysevent_evc_bind failed: %s\n",
360 		    delegate_channel_name, strerror(errno));
361 		goto out;
362 	}
363 
364 	if ((r = sysevent_evc_bind(master_channel_name, &master_channel,
365 	    EVCH_CREAT|EVCH_HOLD_PEND)) != 0) {
366 		uu_warn("%s: sysevent_evc_bind failed: %s\n",
367 		    master_channel_name, strerror(errno));
368 		goto out;
369 	}
370 
371 	log_framework(LOG_DEBUG,
372 	    "%s: Bound to channel %s (delegate), %s (master)\n", fmri,
373 	    delegate_channel_name, master_channel_name);
374 
375 	if ((r = sysevent_evc_subscribe(master_channel, sid, EC_ALL,
376 	    state_cb, fmri, EVCH_SUB_KEEP)) != 0) {
377 		/*
378 		 * The following errors can be returned in this
379 		 * case :
380 		 * 	EINVAL : inappropriate flags or dump flag
381 		 * 		and the dump failed.
382 		 * 	EEXIST : svc.startd already has a channel
383 		 * 		named as the master channel name
384 		 * 	ENOMEM : too many subscribers to the channel
385 		 */
386 		uu_warn("Failed to subscribe to restarter %s, channel %s with "
387 		    "subscriber id %s : \n", fmri, master_channel_name, sid);
388 		switch (r) {
389 		case EEXIST:
390 			uu_warn("Channel name already exists\n");
391 			break;
392 		case ENOMEM:
393 			uu_warn("Too many subscribers for the channel\n");
394 			break;
395 		default:
396 			uu_warn("%s\n", strerror(errno));
397 		}
398 	} else {
399 		log_framework(LOG_DEBUG,
400 		    "%s: Subscribed to channel %s with subscriber id %s\n",
401 		    fmri, master_channel_name, "svc.startd");
402 	}
403 
404 
405 out:
406 	free(delegate_channel_name);
407 	free(master_channel_name);
408 	free(sid);
409 
410 	if (r == 0)
411 		return (delegate_channel);
412 
413 	return (NULL);
414 }
415 
416 void
417 restarter_protocol_send_event(const char *inst, evchan_t *chan,
418     restarter_event_type_t event)
419 {
420 	nvlist_t *attr;
421 	int ret;
422 
423 	/*
424 	 * If the service is managed by the master restarter,
425 	 * queue the event locally.
426 	 */
427 	if (chan == NULL) {
428 		restarter_event_enqueue(inst, event);
429 		MUTEX_LOCK(&ru->restarter_update_lock);
430 		ru->restarter_update_wakeup = 1;
431 		(void) pthread_cond_broadcast(&ru->restarter_update_cv);
432 		MUTEX_UNLOCK(&ru->restarter_update_lock);
433 		return;
434 	}
435 
436 	/*
437 	 * Otherwise, send the event to the delegate.
438 	 */
439 	log_framework(LOG_DEBUG, "Sending %s to channel 0x%p for %s.\n",
440 	    event_names[event], chan, inst);
441 	if (nvlist_alloc(&attr, NV_UNIQUE_NAME, 0) != 0 ||
442 	    nvlist_add_uint32(attr, RESTARTER_NAME_TYPE, event) != 0 ||
443 	    nvlist_add_string(attr, RESTARTER_NAME_INSTANCE, (char *)inst) != 0)
444 		uu_die("Allocation failure\n");
445 
446 	if ((ret = restarter_event_publish_retry(chan, "protocol", "restarter",
447 	    "com.sun", "svc.startd", attr, EVCH_NOSLEEP)) != 0) {
448 
449 		switch (ret) {
450 		case ENOSPC:
451 			log_framework(LOG_DEBUG, "Dropping %s event for %s. "
452 			    "Delegate may not be running.\n",
453 			    event_names[event], inst);
454 			break;
455 		default:
456 			uu_die("%s: can't publish event: %s\n", inst,
457 			    strerror(errno));
458 		}
459 	}
460 
461 	nvlist_free(attr);
462 
463 	if (event != RESTARTER_EVENT_TYPE_ADD_INSTANCE) {
464 		/*
465 		 * Not relevant for graph loading.
466 		 */
467 		return;
468 	}
469 
470 	/*
471 	 * For the purposes of loading state after interruption, this is
472 	 * sufficient, as svc.startd(1M) won't receive events on the contracts
473 	 * associated with each delegate.
474 	 */
475 	MUTEX_LOCK(&st->st_load_lock);
476 	if (--st->st_load_instances == 0)
477 		(void) pthread_cond_broadcast(&st->st_load_cv);
478 	MUTEX_UNLOCK(&st->st_load_lock);
479 
480 }
481