/* Exact reply text expected from the Director after a volume update; compared verbatim with strcmp() */
static char OK_update[] = "1000 OK UpdateMedia\n";
/* Forward referenced functions */
-static int device_wait(JCR *jcr, DEVICE *dev, int wait_sec);
+static int wait_for_sysop(JCR *jcr, DEVICE *dev, int wait_sec);
/*
* Send current JobStatus to Director
/*
 * Receive the Director's reply to a volume-info request and record it
 * in the JCR.
 *
 * Returns 1 when the reply scans as exactly 14 OK_media fields, and 0
 * (with jcr->errmsg set) when bnet_recv() fails or the scan does not
 * match.  jcr->VolumeName is emptied on entry and only refilled on
 * success.
 *
 * Diff note: the '-' side scans straight into jcr->VolCatInfo through
 * a pointer; the '+' side scans into a local VOLUME_CAT_INFO and copies
 * it into jcr->VolCatInfo only after the scan has succeeded.
 */
static int do_request_volume_info(JCR *jcr)
{
BSOCK *dir = jcr->dir_bsock;
- VOLUME_CAT_INFO *vol = &jcr->VolCatInfo;
+ VOLUME_CAT_INFO vol;
jcr->VolumeName[0] = 0; /* No volume */
/* A non-positive bnet_recv() result is reported as a network error */
if (bnet_recv(dir) <= 0) {
Mmsg(&jcr->errmsg, _("Network error on bnet_recv in req_vol_info.\n"));
return 0;
}
/* All 14 OK_media fields must convert, otherwise the reply is rejected */
- if (sscanf(dir->msg, OK_media, vol->VolCatName,
- &vol->VolCatJobs, &vol->VolCatFiles,
- &vol->VolCatBlocks, &vol->VolCatBytes,
- &vol->VolCatMounts, &vol->VolCatErrors,
- &vol->VolCatWrites, &vol->VolCatMaxBytes,
- &vol->VolCatCapacityBytes, vol->VolCatStatus,
- &vol->Slot, &vol->VolCatMaxJobs, &vol->VolCatMaxFiles) != 14) {
+ if (sscanf(dir->msg, OK_media, vol.VolCatName,
+ &vol.VolCatJobs, &vol.VolCatFiles,
+ &vol.VolCatBlocks, &vol.VolCatBytes,
+ &vol.VolCatMounts, &vol.VolCatErrors,
+ &vol.VolCatWrites, &vol.VolCatMaxBytes,
+ &vol.VolCatCapacityBytes, vol.VolCatStatus,
+ &vol.Slot, &vol.VolCatMaxJobs, &vol.VolCatMaxFiles) != 14) {
Dmsg1(200, "Bad response from Dir: %s\n", dir->msg);
Mmsg(&jcr->errmsg, _("Error scanning Dir response: %s\n"), dir->msg);
return 0;
}
/*
 * Scan succeeded: the received name becomes the desired VolumeName.
 * NOTE(review): unbash_spaces() presumably restores spaces that were
 * escaped for transmission -- confirm against its definition.
 * On the '+' side this is also the point where the local copy is
 * published into jcr->VolCatInfo.
 */
- unbash_spaces(vol->VolCatName);
- pm_strcpy(&jcr->VolumeName, vol->VolCatName); /* set desired VolumeName */
+ unbash_spaces(vol.VolCatName);
+ pm_strcpy(&jcr->VolumeName, vol.VolCatName); /* set desired VolumeName */
+ memcpy(&jcr->VolCatInfo, &vol, sizeof(jcr->VolCatInfo));
Dmsg2(200, "do_reqest_vol_info got slot=%d Volume=%s\n",
- vol->Slot, vol->VolCatName);
+ vol.Slot, vol.VolCatName);
return 1;
}
unbash_spaces(vol->VolCatName);
if (bnet_recv(dir) <= 0) {
Dmsg0(190, "updateVolCatInfo error bnet_recv\n");
- Jmsg(jcr, M_ERROR, 0, _("Error updating Volume Info: %s\n"),
- bnet_strerror(dir));
+ Jmsg(jcr, M_ERROR, 0, _("Error updating Volume info Vol=\"%s\": ERR=%s\n"),
+ vol->VolCatName, bnet_strerror(dir));
return 0;
}
Dmsg1(120, "Updatevol: %s", dir->msg);
if (strcmp(dir->msg, OK_update) != 0) {
Dmsg1(130, "Bad response from Dir: %s\n", dir->msg);
- Jmsg(jcr, M_ERROR, 0, _("Error updating Volume Info: %s\n"), dir->msg);
+ Jmsg(jcr, M_ERROR, 0, _("Error updating Volume info Vol=\"%s\": %s\n"),
+ vol->VolCatName, dir->msg);
return 0;
}
return 1;
Dmsg1(100, "create_jobmedia(): %s", dir->msg);
if (bnet_recv(dir) <= 0) {
Dmsg0(190, "create_jobmedia error bnet_recv\n");
- Jmsg(jcr, M_ERROR, 0, _("Error creating JobMedia record: %s\n"),
+ Jmsg(jcr, M_ERROR, 0, _("Error creating JobMedia record: ERR=%s\n"),
bnet_strerror(dir));
return 0;
}
jcr->JobStatus = jstat;
dir_send_job_status(jcr);
- stat = device_wait(jcr, dev, wait_sec);
+ stat = wait_for_sysop(jcr, dev, wait_sec);
if (stat == ETIMEDOUT) {
wait_sec *= 2; /* double wait time */
jcr->JobStatus = JS_WaitMount;
dir_send_job_status(jcr);
- stat = device_wait(jcr, dev, wait_sec); /* wait on device */
+ stat = wait_for_sysop(jcr, dev, wait_sec); /* wait on device */
if (stat == ETIMEDOUT) {
wait_sec *= 2; /* double wait time */
return 1;
}
-#define HB_TIME 20*60 /* send a heatbeat once every 20 minutes while waiting */
-
-static int device_wait(JCR *jcr, DEVICE *dev, int wait_sec)
+/*
+ * Wait for SysOp to mount a tape
+ */
+static int wait_for_sysop(JCR *jcr, DEVICE *dev, int wait_sec)
{
struct timeval tv;
struct timezone tz;
time_t start = time(NULL);
time_t last_heartbeat = 0;
int stat = 0;
+ int add_wait;
/*
* Wait requested time (wait_sec). However, we also wake up periodically
* to send heartbeats on the FD and Director sockets, to keep stateful
* firewalls from closing them down while waiting for the operator.
*/
+ add_wait = wait_sec;
+ if (me->heartbeat_interval && add_wait > me->heartbeat_interval) {
+ add_wait = me->heartbeat_interval;
+ }
gettimeofday(&tv, &tz);
timeout.tv_nsec = tv.tv_usec * 1000;
- timeout.tv_sec = tv.tv_sec + (wait_sec > HB_TIME ? HB_TIME: wait_sec);
+ timeout.tv_sec = tv.tv_sec + add_wait;
P(dev->mutex);
dev_blocked = dev->dev_blocked;
dev->dev_blocked = BST_WAITING_FOR_SYSOP; /* indicate waiting for mount */
for ( ; !job_canceled(jcr); ) {
- int add_wait;
+ time_t now;
- Dmsg1(190, "I'm going to sleep on device %s\n", dev->dev_name);
+ Dmsg3(100, "I'm going to sleep on device %s. HB=%d wait=%d\n", dev->dev_name,
+ (int)me->heartbeat_interval, wait_sec);
stat = pthread_cond_timedwait(&dev->wait_next_vol, &dev->mutex, &timeout);
+ Dmsg1(100, "Wokeup from sleep on device stat=%d\n", stat);
+
+ now = time(NULL);
/* Note, this always triggers the first time. We want that. */
- time_t now = time(NULL);
- if (now - last_heartbeat >= HB_TIME) {
- /* send heartbeats */
- if (jcr->file_bsock) {
- bnet_sig(jcr->file_bsock, BNET_HEARTBEAT);
- }
- if (jcr->dir_bsock) {
- bnet_sig(jcr->dir_bsock, BNET_HEARTBEAT);
+ if (me->heartbeat_interval) {
+ if (now - last_heartbeat >= me->heartbeat_interval) {
+ /* send heartbeats */
+ if (jcr->file_bsock) {
+ bnet_sig(jcr->file_bsock, BNET_HEARTBEAT);
+ Dmsg0(100, "Send heartbeat to FD.\n");
+ }
+ if (jcr->dir_bsock) {
+ bnet_sig(jcr->dir_bsock, BNET_HEARTBEAT);
+ }
+ last_heartbeat = now;
}
- last_heartbeat = now;
}
- /* Check if we blocked the device */
- if (dev->dev_blocked == BST_WAITING_FOR_SYSOP) {
- if (stat != ETIMEDOUT) { /* we blocked the device */
- break; /* on error return */
- }
- if (now - start >= wait_sec) { /* on exceeding wait time return */
- break;
- }
- add_wait = wait_sec - (now - start);
- if (add_wait > HB_TIME) {
- add_wait = HB_TIME;
- }
- } else { /* Oops someone else has it blocked now */
- add_wait = 10; /* hang around until he releases it */
+ if (dev->dev_blocked == BST_MOUNT) { /* mount request ? */
+ stat = 0;
+ break;
+ }
+
+ if (stat != ETIMEDOUT) { /* we blocked the device */
+ break; /* on error return */
+ }
+ if (now - start >= wait_sec) { /* on exceeding wait time return */
+ Dmsg0(100, "Exceed wait time.\n");
+ break;
+ }
+ add_wait = wait_sec - (now - start);
+ if (me->heartbeat_interval && add_wait > me->heartbeat_interval) {
+ add_wait = me->heartbeat_interval;
}
- /*
- * Note, if dev_blocked is not BST_WAITING FOR_SYSOP,
- * someone other than us has blocked the device (probably the
- * user via the Console program), so we continue waiting
- * until he releases the device back to us.
- */
gettimeofday(&tv, &tz);
timeout.tv_nsec = tv.tv_usec * 1000;
timeout.tv_sec = tv.tv_sec + add_wait; /* additional wait */
+ Dmsg1(100, "Additional wait %d sec.\n", add_wait);
}
dev->dev_blocked = dev_blocked;