2 * Second generation Storage daemon.
4 * It accepts a number of simple commands from the File daemon
5 * and acts on them. When a request to append data is made,
6 * it opens a data channel and accepts data from the File daemon.
13 Copyright (C) 2000-2005 Kern Sibbald
15 This program is free software; you can redistribute it and/or
16 modify it under the terms of the GNU General Public License as
17 published by the Free Software Foundation; either version 2 of
18 the License, or (at your option) any later version.
20 This program is distributed in the hope that it will be useful,
21 but WITHOUT ANY WARRANTY; without even the implied warranty of
22 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
23 General Public License for more details.
25 You should have received a copy of the GNU General Public
26 License along with this program; if not, write to the Free
27 Software Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
35 /* Imported functions */
38 /* Forward referenced functions */
/* Both functions are defined later in this file */
39 void terminate_stored(int sig);
40 static void check_config();
/* Start routine handed to pthread_create() in main() */
42 extern "C" void *device_initialization(void *arg);
/* Used by main() when no configuration file was named on the command line */
44 #define CONFIG_FILE "bacula-sd.conf" /* Default config file */
46 /* Global variables exported */
/* Fixed reply strings; their users are not visible in this part of the file */
47 char OK_msg[] = "3000 OK\n";
48 char TERM_msg[] = "3999 Terminate\n";
49 STORES *me = NULL; /* our Global resource; assigned in check_config() from the first Storage resource */
50 bool forge_on = false; /* proceed in spite of I/O errors (cf. the -p option) */
/*
 * wait_device_release is broadcast by terminate_stored() when a job's
 * device is blocked. NOTE(review): device_release_mutex is presumably the
 * mutex paired with that condition variable - confirm against its users.
 */
51 pthread_mutex_t device_release_mutex = PTHREAD_MUTEX_INITIALIZER;
52 pthread_cond_t wait_device_release = PTHREAD_COND_INITIALIZER;
/* Session Id counter; only its initialization to 0 is visible here */
55 static uint32_t VolSessionId = 0;
/* Assigned from daemon_start_time in main() */
56 uint32_t VolSessionTime;
59 /* Global static variables */
/* NOTE(review): presumably set by the -f option - the assignment is not visible here */
60 static int foreground = 0;
/* NOTE(review): the users of this mutex are not visible in this view */
61 static pthread_mutex_t mutex = PTHREAD_MUTEX_INITIALIZER;
62 static workq_t dird_workq; /* queue for processing connections; passed to bnet_thread_server() in main() */
68 "Copyright (C) 2000-2005 Kern Sibbald.\n"
69 "\nVersion: " VERSION " (" BDATE ")\n\n"
70 "Usage: stored [options] [-c config_file] [config_file]\n"
71 " -c <file> use <file> as configuration file\n"
72 " -dnn set debug level to nn\n"
73 " -f run in foreground (for debugging)\n"
74 " -g <group> set groupid to group\n"
75 " -p proceed despite I/O errors\n"
76 " -s no signals (for debugging)\n"
77 " -t test - read config and exit\n"
78 " -u <user> userid to <user>\n"
79 " -v verbose user messages\n"
80 " -? print this message.\n"
85 /*********************************************************************
87 * Main Bacula Unix Storage Daemon
 *
 * Visible flow: name the daemon and set up messaging, check that
 * TAPE_BSIZE is a non-zero multiple of B_DEV_BSIZE and a power of two,
 * process the command line options, pick the configuration file
 * (-c, a bare trailing argument, or CONFIG_FILE as the default) and
 * parse it. Then daemon_start(), pid file creation and state file
 * reading, VolSessionTime setup, Python interpreter init, creation of
 * the device_initialization() thread, watchdog and JCR subsystem
 * startup, and finally bnet_thread_server(), which is used for both
 * the Director and the File daemon.
 *
 * NOTE(review): several statements of this function are not visible
 * in this view, so the conditions around the calls listed above are
 * deliberately not described here.
90 int main (int argc, char *argv[])
93 int no_signals = FALSE;
94 int test_config = FALSE;
100 my_name_is(argc, argv, "bacula-sd");
101 textdomain("bacula");
102 init_msg(NULL, NULL);
103 daemon_start_time = time(NULL);
106 if (TAPE_BSIZE % B_DEV_BSIZE != 0 || TAPE_BSIZE / B_DEV_BSIZE == 0) {
107 Emsg2(M_ABORT, 0, "Tape block size (%d) not multiple of system size (%d)\n",
108 TAPE_BSIZE, B_DEV_BSIZE);
110 if (TAPE_BSIZE != (1 << (ffs(TAPE_BSIZE)-1))) {
111 Emsg1(M_ABORT, 0, "Tape block size (%d) is not a power of 2\n", TAPE_BSIZE);
114 while ((ch = getopt(argc, argv, "c:d:fg:pstu:v?")) != -1) {
116 case 'c': /* configuration file */
117 if (configfile != NULL) {
120 configfile = bstrdup(optarg);
123 case 'd': /* debug level */
124 debug_level = atoi(optarg);
125 if (debug_level <= 0) {
130 case 'f': /* run in foreground */
134 case 'g': /* set group id */
138 case 'p': /* proceed in spite of I/O errors */
142 case 's': /* no signals */
150 case 'u': /* set uid */
154 case 'v': /* verbose */
/* A configuration file may also be given as a bare argument after the options */
168 if (configfile != NULL) {
171 configfile = bstrdup(*argv);
179 init_signals(terminate_stored);
/* Neither -c nor a bare argument named a file: use the default name */
182 if (configfile == NULL) {
183 configfile = bstrdup(CONFIG_FILE);
186 parse_config(configfile);
194 daemon_start(); /* become daemon */
195 init_stack_dump(); /* pick up new pid */
/* Both files are identified by "bacula-sd" plus get_first_port_host_order(me->sdaddrs) */
198 create_pid_file(me->pid_directory, "bacula-sd", get_first_port_host_order(me->sdaddrs));
199 read_state_file(me->working_directory, "bacula-sd", get_first_port_host_order(me->sdaddrs));
203 /* Ensure that Volume Session Time and Id are both
204 * set and are both non-zero.
206 VolSessionTime = (long)daemon_start_time;
207 if (VolSessionTime == 0) { /* paranoid */
208 Jmsg0(NULL, M_ABORT, 0, _("Volume Session Time is ZERO!\n"));
211 init_python_interpreter(me->hdr.name, me->scripts_directory, "SDStartUp");
213 /* Make sure on Solaris we can run concurrent, watch dog + servers + misc */
214 set_thread_concurrency(me->max_concurrent_jobs * 2 + 4);
/*
 * NOTE(review): pthread_create() reports failure through its return value
 * and is not specified to set errno, so strerror(errno) in the message
 * below may not describe the actual error.
 */
217 * Start the device allocation thread
219 if (pthread_create(&thid, NULL, device_initialization, NULL) != 0) {
220 Emsg1(M_ABORT, 0, _("Unable to create thread. ERR=%s\n"), strerror(errno));
223 start_watchdog(); /* start watchdog thread */
225 init_jcr_subsystem(); /* start JCR watchdogs etc. */
228 * Sleep a bit to give device thread a chance to lock the resource
229 * chain before we start the server.
233 /* Single server used for Director and File daemon */
234 bnet_thread_server(me->sdaddrs, me->max_concurrent_jobs * 2 + 1,
235 &dird_workq, handle_connection_request);
236 exit(1); /* to keep compiler quiet */
239 /* Return a new Session Id */
/*
 * NOTE(review): the body of this function is not visible in this view.
 * Presumably the value is derived from the file-static VolSessionId
 * counter - confirm against the full source before relying on this.
 */
240 uint32_t newVolSessionId()
251 /* Check Configuration file for necessary info */
/*
 * Validates the parsed configuration and publishes it through the
 * global "me". The following problems are reported with M_ERROR_TERM:
 * no Storage resource, more than one Storage resource, no Director
 * resource, no Device resource, no Messages resource, no Working
 * Directory, and an Autochanger whose devices do not all share the
 * same Media Type.
 *
 * Visible side effects: sets "me" and me->messages, renames the daemon
 * to me->hdr.name, replaces the temporary message handler with the
 * daemon one, sets the working directory, and fills in a device's
 * missing changer_name / changer_command from its Autochanger.
 */
252 static void check_config()
254 AUTOCHANGER *changer;
/* The first Storage resource becomes the global "me" */
257 me = (STORES *)GetNextRes(R_STORAGE, NULL);
260 Jmsg1(NULL, M_ERROR_TERM, 0, _("No Storage resource defined in %s. Cannot continue.\n"),
263 my_name_is(0, (char **)NULL, me->hdr.name); /* Set our real name */
/* Asking for the resource after "me" must yield nothing: only one is permitted */
265 if (GetNextRes(R_STORAGE, (RES *)me) != NULL) {
267 Jmsg1(NULL, M_ERROR_TERM, 0, _("Only one Storage resource permitted in %s\n"),
270 if (GetNextRes(R_DIRECTOR, NULL) == NULL) {
272 Jmsg1(NULL, M_ERROR_TERM, 0, _("No Director resource defined in %s. Cannot continue.\n"),
275 if (GetNextRes(R_DEVICE, NULL) == NULL){
277 Jmsg1(NULL, M_ERROR_TERM, 0, _("No Device resource defined in %s. Cannot continue.\n"),
/* The first Messages resource is attached to "me" */
281 me->messages = (MSGS *)GetNextRes(R_MSGS, NULL);
283 Jmsg1(NULL, M_ERROR_TERM, 0, _("No Messages resource defined in %s. Cannot continue.\n"),
287 close_msg(NULL); /* close temp message handler */
288 init_msg(NULL, me->messages); /* open daemon message handler */
291 if (!me->working_directory) {
292 Jmsg1(NULL, M_ERROR_TERM, 0, _("No Working Directory defined in %s. Cannot continue.\n"),
295 set_working_directory(me->working_directory);
297 /* Ensure that the media_type for each device is the same */
298 foreach_res(changer, R_AUTOCHANGER) {
/* media_type remembers the Media Type of the first device seen in this changer */
300 char *media_type = NULL;
301 foreach_alist(device, changer->device) {
302 if (media_type == NULL) {
303 media_type = device->media_type;
/*
 * NOTE(review): strcmp() is applied to device->media_type without a
 * visible NULL check - confirm that the parser guarantees it is set.
 */
306 if (strcmp(media_type, device->media_type) != 0) {
307 Jmsg(NULL, M_ERROR_TERM, 0,
308 _("Media Type not the same for all devices in changer %s. Cannot continue.\n"),
/*
 * NOTE(review): changer->changer_name and changer->changer_command are
 * duplicated below without a visible NULL check - confirm that bstrdup()
 * tolerates NULL or that the Autochanger resource requires both.
 */
312 * If the device does not have a changer name or changer command
313 * defined, used the one from the Autochanger resource
315 if (!device->changer_name) {
316 device->changer_name = bstrdup(changer->changer_name);
318 if (!device->changer_command) {
319 device->changer_command = bstrdup(changer->changer_command);
327 * Here we attempt to init and open each device. This is done
328 * once at startup in a separate thread.
/*
 * Thread start routine; main() creates it with pthread_create() and a
 * NULL argument. It detaches itself and then walks every Device
 * resource:
 *   - init_dev() result is stored in device->dev; a failure is
 *     reported as "Could not initialize".
 *   - if CAP_ALWAYSOPEN is set, the device is opened with
 *     first_open_device(); a failure is reported as "Could not open".
 *   - if CAP_AUTOMOUNT is set and the device is open, a JCR of type
 *     JT_SYSTEM and a DCR are created and the volume label is read.
 *     On one visible path the DCR's VolCatInfo is copied into the
 *     device; on another a "Could not mount device" warning is issued.
 *
 * NOTE(review): the case labels of the switch and the cleanup of the
 * JCR/DCR are not visible in this view.
 */
331 void *device_initialization(void *arg)
336 pthread_detach(pthread_self());
338 foreach_res(device, R_DEVICE) {
339 Dmsg1(90, "calling init_dev %s\n", device->device_name);
340 device->dev = init_dev(NULL, NULL, device);
/* NOTE(review): this debug line appears before the visible failure report for init_dev() */
341 Dmsg1(10, "SD init done %s\n", device->device_name);
343 Jmsg1(NULL, M_ERROR, 0, _("Could not initialize %s\n"), device->device_name);
347 if (device->cap_bits & CAP_ALWAYSOPEN) {
348 Dmsg1(20, "calling first_open_device %s\n", device->device_name);
349 if (!first_open_device(device->dev)) {
350 Jmsg1(NULL, M_ERROR, 0, _("Could not open device %s\n"), device->device_name);
/* Automount only applies to a device that exists and is currently open */
353 if (device->cap_bits & CAP_AUTOMOUNT && device->dev &&
354 device->dev->is_open()) {
357 jcr = new_jcr(sizeof(JCR), stored_free_jcr);
358 jcr->JobType = JT_SYSTEM;
359 /* Initialize FD start condition variable */
/* pthread_cond_init() returns the error number, which is what strerror() receives below */
360 int errstat = pthread_cond_init(&jcr->job_start_wait, NULL);
362 Jmsg1(jcr, M_ABORT, 0, _("Unable to init job cond variable: ERR=%s\n"), strerror(errstat));
364 dcr = new_dcr(jcr, device->dev);
365 switch (read_dev_volume_label(dcr)) {
/* Copy the catalog info held by the DCR into the device */
367 memcpy(&dcr->dev->VolCatInfo, &dcr->VolCatInfo, sizeof(dcr->dev->VolCatInfo));
370 Jmsg1(NULL, M_WARNING, 0, _("Could not mount device %s\n"), device->device_name);
381 /* Clean up and then exit */
/*
 * Registered in main() through init_signals(); sig is the signal (or
 * termination code) that triggered the shutdown.
 *
 * A static flag guards against being entered a second time. For
 * SIGTERM the jobs are walked first: every job with a non-zero JobId is
 * marked JS_Canceled, its File daemon socket is flagged as timed out,
 * its thread is sent TIMEOUT_SIGNAL, and waiters on a blocked device are
 * woken. Afterwards the state file is written, the pid file deleted,
 * every Device resource is passed to term_dev(), the configuration
 * resources are freed, memory pool statistics are printed when
 * debug_level is above 10, and orphaned buffers are dumped.
 *
 * NOTE(review): the loop header over the jobs, the locking around it
 * and the final exit are not visible in this view.
 */
382 void terminate_stored(int sig)
384 static bool in_here = false;
388 if (in_here) { /* prevent loops */
393 if (sig == SIGTERM) { /* normal shutdown request? */
395 * This is a normal shutdown request. We wiffle through
396 * all open jobs canceling them and trying to wake
397 * them up so that they will report back the correct
/*
 * NOTE(review): jcr is still dereferenced after free_locked_jcr(jcr).
 * Presumably that call only drops a reference while the job stays
 * alive - confirm against its definition.
 */
403 free_locked_jcr(jcr);
404 if (jcr->JobId == 0) {
405 continue; /* ignore console */
407 set_jcr_job_status(jcr, JS_Canceled);
408 fd = jcr->file_bsock;
410 fd->timed_out = true;
411 Dmsg1(100, "term_stored killing JobId=%d\n", jcr->JobId);
412 pthread_kill(jcr->my_thread_id, TIMEOUT_SIGNAL);
413 /* ***FIXME*** wiffle through all dcrs */
/* Wake anything waiting for the next volume or for a device release */
414 if (jcr->dcr && jcr->dcr->dev && jcr->dcr->dev->dev_blocked) {
415 pthread_cond_broadcast(&jcr->dcr->dev->wait_next_vol);
416 pthread_cond_broadcast(&wait_device_release);
418 bmicrosleep(0, 50000);
422 bmicrosleep(0, 500000); /* give them 1/2 sec to clean up */
/* Same identification ("bacula-sd" plus first SD port) as used at startup in main() */
425 write_state_file(me->working_directory, "bacula-sd", get_first_port_host_order(me->sdaddrs));
426 delete_pid_file(me->pid_directory, "bacula-sd", get_first_port_host_order(me->sdaddrs));
428 Dmsg1(200, "In terminate_stored() sig=%d\n", sig);
431 foreach_res(device, R_DEVICE) {
433 term_dev(device->dev);
440 free_config_resources();
442 if (debug_level > 10) {
443 print_memory_pool_stats();
449 sm_dump(false); /* dump orphaned buffers */