+
+/*
+ * Decide whether a finished job must be rescheduled and, if so, arrange
+ *  for it to run again after job->RescheduleInterval seconds.
+ *
+ * A job qualifies only while reschedule attempts remain (RescheduleTimes
+ *  of 0 does not limit the count) and it is a Backup job that is either
+ *    - incomplete, with RescheduleIncompleteJobs set and no Base job
+ *      involved, or
+ *    - neither Terminated nor Canceled, with RescheduleOnError set.
+ *
+ * Two ways of re-running exist:
+ *    - same JCR: used when no bytes were written or the job is being
+ *      re-run as incomplete; the JCR is put back on the queue, then
+ *      released here together with the queue item "je".
+ *    - new JCR: used when data was written; a fresh JCR is built from
+ *      the old one and handed to run_job().
+ *
+ * NOTE(review): jq->mutex is released (V) around jobq_add()/run_job() and
+ *  re-taken (P) afterwards, so the caller presumably holds it on entry --
+ *  confirm against the caller.
+ *
+ * Returns true if cleanup done and we should look for more work
+ *  (only the same-JCR requeue path); false in every other case.
+ */
+static bool reschedule_job(JCR *jcr, jobq_t *jq, jobq_item_t *je)
+{
+   bool resched = false;
+   /*
+    * Reschedule the job if requested and possible
+    */
+   /* Basic condition is that more reschedule times remain */
+   if (jcr->job->RescheduleTimes == 0 ||
+       jcr->reschedule_count < jcr->job->RescheduleTimes) {
+
+      /* Check for incomplete jobs */
+      if (jcr->is_incomplete()) {
+         resched = (jcr->RescheduleIncompleteJobs && jcr->is_JobType(JT_BACKUP) &&
+                    !(jcr->HasBase||jcr->is_JobLevel(L_BASE)));
+      } else {
+         /* Check for failed jobs */
+         resched = (jcr->job->RescheduleOnError &&
+                    !jcr->is_JobStatus(JS_Terminated) &&
+                    !jcr->is_JobStatus(JS_Canceled) &&
+                    jcr->is_JobType(JT_BACKUP));
+      }
+   }
+   if (resched) {
+      char dt[50], dt2[50];
+
+      /*
+       * Reschedule this job by cleaning it up, but
+       *  reuse the same JobId if possible.
+       */
+      jcr->rerunning = jcr->is_incomplete();   /* save incomplete status */
+      time_t now = time(NULL);
+      jcr->reschedule_count++;
+      jcr->sched_time = now + jcr->job->RescheduleInterval;
+      bstrftime(dt, sizeof(dt), now);
+      bstrftime(dt2, sizeof(dt2), jcr->sched_time);
+      /*
+       * %u consumes an unsigned int, so the time values are cast
+       *  explicitly to keep the variadic arguments in step with the format.
+       */
+      Dmsg4(2300, "Rescheduled Job %s to re-run in %d seconds.(now=%u,then=%u)\n", jcr->Job,
+            (int)jcr->job->RescheduleInterval, (unsigned)now, (unsigned)jcr->sched_time);
+      Jmsg(jcr, M_INFO, 0, _("Rescheduled Job %s at %s to re-run in %d seconds (%s).\n"),
+           jcr->Job, dt, (int)jcr->job->RescheduleInterval, dt2);
+      dird_free_jcr_pointers(jcr);     /* partial cleanup old stuff */
+      /* Reset the status fields before the job waits for its new start time */
+      jcr->JobStatus = -1;
+      jcr->setJobStatus(JS_WaitStartTime);
+      jcr->SDJobStatus = 0;
+      jcr->JobErrors = 0;
+      if (!allow_duplicate_job(jcr)) {
+         return false;
+      }
+      /* Only jobs with no output or Incomplete jobs can run on same JCR */
+      if (jcr->JobBytes == 0 || jcr->rerunning) {
+         Dmsg2(2300, "Requeue job=%d use=%d\n", jcr->JobId, jcr->use_count());
+         V(jq->mutex);
+         /*
+          * Special test here since a Virtual Full gets marked
+          *  as a Full, so we look at the resource record
+          */
+         if (jcr->wasVirtualFull) {
+            jcr->setJobLevel(L_VIRTUAL_FULL);
+         }
+         /*
+          * When we are using the same jcr then make sure to reset
+          *  RealEndTime back to zero.
+          */
+         jcr->jr.RealEndTime = 0;
+         jobq_add(jq, jcr);            /* queue the job to run again */
+         P(jq->mutex);
+         free_jcr(jcr);                /* release jcr */
+         free(je);                     /* free the job entry */
+         return true;                  /* we already cleaned up */
+      }
+      /*
+       * Something was actually backed up, so we cannot reuse
+       *  the old JobId or there will be database record
+       *  conflicts.  We now create a new job, copying the
+       *  appropriate fields.
+       */
+      JCR *njcr = new_jcr(sizeof(JCR), dird_free_jcr);
+      set_jcr_defaults(njcr, jcr->job);
+      /*
+       * Eliminate the new job_end_push, then copy the one from
+       *  the old job, and set the old one to be empty.
+       */
+      void *v;
+      lock_jobs();                     /* protect ourself from reload_config() */
+      LockRes();
+      foreach_alist(v, (&jcr->job_end_push)) {
+         njcr->job_end_push.append(v);
+      }
+      jcr->job_end_push.destroy();
+      jcr->job_end_push.init(1, false);
+      UnlockRes();
+      unlock_jobs();
+
+      /* Carry the scheduling state over to the new JCR */
+      njcr->reschedule_count = jcr->reschedule_count;
+      njcr->sched_time = jcr->sched_time;
+      njcr->initial_sched_time = jcr->initial_sched_time;
+      /*
+       * Special test here since a Virtual Full gets marked
+       *  as a Full, so we look at the resource record
+       */
+      if (jcr->wasVirtualFull) {
+         njcr->setJobLevel(L_VIRTUAL_FULL);
+      } else {
+         njcr->setJobLevel(jcr->getJobLevel());
+      }
+      /* Pools and their run-time override flags */
+      njcr->pool = jcr->pool;
+      njcr->run_pool_override = jcr->run_pool_override;
+      njcr->next_pool = jcr->next_pool;
+      njcr->run_next_pool_override = jcr->run_next_pool_override;
+      njcr->full_pool = jcr->full_pool;
+      njcr->vfull_pool = jcr->vfull_pool;
+      njcr->run_full_pool_override = jcr->run_full_pool_override;
+      njcr->run_vfull_pool_override = jcr->run_vfull_pool_override;
+      njcr->inc_pool = jcr->inc_pool;
+      njcr->run_inc_pool_override = jcr->run_inc_pool_override;
+      njcr->diff_pool = jcr->diff_pool;
+      njcr->JobStatus = -1;
+      njcr->setJobStatus(jcr->JobStatus);
+      /* Copy the storage lists, or drop the defaults if the old job had none */
+      if (jcr->rstore) {
+         copy_rstorage(njcr, jcr->rstorage, _("previous Job"));
+      } else {
+         free_rstorage(njcr);
+      }
+      if (jcr->wstore) {
+         copy_wstorage(njcr, jcr->wstorage, _("previous Job"));
+      } else {
+         free_wstorage(njcr);
+      }
+      njcr->messages = jcr->messages;
+      njcr->spool_data = jcr->spool_data;
+      njcr->write_part_after_job = jcr->write_part_after_job;
+      Dmsg0(2300, "Call to run new job\n");
+      V(jq->mutex);
+      run_job(njcr);                   /* This creates a "new" job */
+      free_jcr(njcr);                  /* release "new" jcr */
+      P(jq->mutex);
+      Dmsg0(2300, "Back from running new job.\n");
+   }
+   return false;
+}
+
+/*
+ * Try to reserve every concurrency slot the job (JCR) needs, in this
+ *  order: read storage, write storage, client, job.  When a later
+ *  reservation cannot be made, the slots already taken are given back.
+ *
+ *  Returns: true  if everything was reserved
+ *                 (jcr->acquired_resource_locks is then set)
+ *           false if a resource was unavailable; JobStatus is set to
+ *                 JS_WaitStoreRes, JS_WaitClientRes or JS_WaitJobRes
+ */
+static bool acquire_resources(JCR *jcr)
+{
+   jcr->acquired_resource_locks = false;
+/*
+ * Turning this code off is likely to cause some deadlocks,
+ *  but we do not really have enough information here to
+ *  know if this is really a deadlock (it may be a dual drive
+ *  autochanger), and in principle, the SD reservation system
+ *  should detect these deadlocks, so push the work off on it.
+ */
+#ifdef xxx
+   if (jcr->rstore && jcr->rstore == jcr->wstore) {    /* possible deadlock */
+      Jmsg(jcr, M_FATAL, 0, _("Job canceled. Attempt to read and write same device.\n"
+         " Read storage \"%s\" (From %s) -- Write storage \"%s\" (From %s)\n"),
+         jcr->rstore->name(), jcr->rstore_source, jcr->wstore->name(), jcr->wstore_source);
+      jcr->setJobStatus(JS_Canceled);
+      return false;
+   }
+#endif
+
+   /* Step 1: read storage */
+   if (jcr->rstore) {
+      Dmsg1(200, "Rstore=%s\n", jcr->rstore->name());
+      if (!inc_read_store(jcr)) {
+         Dmsg1(200, "Fail rncj=%d\n", jcr->rstore->getNumConcurrentJobs());
+         jcr->setJobStatus(JS_WaitStoreRes);
+         return false;
+      }
+   }
+
+   /* Step 2: write storage */
+   if (jcr->wstore) {
+      Dmsg1(200, "Wstore=%s\n", jcr->wstore->name());
+      int wncj = jcr->wstore->getNumConcurrentJobs();
+      if (wncj < jcr->wstore->MaxConcurrentJobs) {
+         Dmsg1(200, "Inc wncj=%d\n", wncj + 1);
+         jcr->wstore->setNumConcurrentJobs(wncj + 1);
+      } else {
+         /* No write slot left: undo step 1 if it took one, then give up */
+         if (jcr->rstore) {
+            dec_read_store(jcr);
+         } else {
+            Dmsg1(200, "Fail wncj=%d\n", wncj);
+         }
+         jcr->setJobStatus(JS_WaitStoreRes);
+         return false;
+      }
+   }
+
+   /* Step 3: client */
+   if (jcr->client) {
+      if (jcr->client->getNumConcurrentJobs() >= jcr->client->MaxConcurrentJobs) {
+         /* Undo steps 1 and 2 */
+         dec_write_store(jcr);
+         dec_read_store(jcr);
+         jcr->setJobStatus(JS_WaitClientRes);
+         return false;
+      }
+      update_client_numconcurrentjobs(jcr, 1);
+   }
+
+   /* Step 4: the job resource itself */
+   if (jcr->job->getNumConcurrentJobs() >= jcr->job->MaxConcurrentJobs) {
+      /* Undo steps 1 to 3 */
+      dec_write_store(jcr);
+      dec_read_store(jcr);
+      update_client_numconcurrentjobs(jcr, -1);
+      jcr->setJobStatus(JS_WaitJobRes);
+      return false;
+   }
+   int jncj = jcr->job->getNumConcurrentJobs() + 1;
+   jcr->job->setNumConcurrentJobs(jncj);
+
+   jcr->acquired_resource_locks = true;
+   return true;
+}
+
+static pthread_mutex_t rstore_mutex = PTHREAD_MUTEX_INITIALIZER; /* held by inc_read_store() and dec_read_store() while they update the read-storage job counters */
+
+/*
+ * Reserve one slot on the job's read storage (jcr->rstore), under
+ *  rstore_mutex.
+ *
+ * The slot is granted when the storage is below MaxConcurrentJobs and,
+ *  in addition, one of these holds: the job is a Restore, no read job
+ *  is running yet, MaxConcurrentReadJobs is 0 (no limit set), or the
+ *  number of read jobs is below that limit.
+ *
+ * Returns: true  if both counters were incremented
+ *          false if nothing was changed
+ *
+ * Note: inc_read_store() and dec_read_store() are
+ *  called from select_rstore() in src/dird/restore.c
+ */
+bool inc_read_store(JCR *jcr)
+{
+   bool granted = false;
+
+   P(rstore_mutex);
+   int total = jcr->rstore->getNumConcurrentJobs();
+   int readers = jcr->rstore->getNumConcurrentReadJobs();
+   int read_limit = jcr->rstore->MaxConcurrentReadJobs;
+   if (total < jcr->rstore->MaxConcurrentJobs) {
+      if (jcr->getJobType() == JT_RESTORE ||
+          readers == 0 ||
+          read_limit == 0 ||            /* No limit set */
+          readers < read_limit) {       /* Below the limit */
+         jcr->rstore->setNumConcurrentReadJobs(readers + 1);
+         jcr->rstore->setNumConcurrentJobs(total + 1);
+         Dmsg1(200, "Inc rncj=%d\n", total + 1);
+         granted = true;
+      }
+   }
+   V(rstore_mutex);
+   return granted;
+}
+
+/*
+ * Give back one slot on the job's read storage: both the read-job
+ *  counter and the overall job counter of jcr->rstore are decremented
+ *  under rstore_mutex.  Does nothing when the job has no read storage.
+ */
+void dec_read_store(JCR *jcr)
+{
+   if (!jcr->rstore) {
+      return;
+   }
+   P(rstore_mutex);
+   int readers_left = jcr->rstore->getNumConcurrentReadJobs() - 1;
+   int jobs_left = jcr->rstore->getNumConcurrentJobs() - 1;
+   jcr->rstore->setNumConcurrentReadJobs(readers_left);
+   jcr->rstore->setNumConcurrentJobs(jobs_left);
+   Dmsg1(200, "Dec rncj=%d\n", jobs_left);
+   V(rstore_mutex);
+}
+
+/*
+ * Give back one slot on the job's write storage by decrementing the
+ *  job counter of jcr->wstore.  Does nothing when the job has no write
+ *  storage.  No mutex is taken here.
+ *  NOTE(review): callers presumably serialize access -- confirm.
+ */
+static void dec_write_store(JCR *jcr)
+{
+   if (!jcr->wstore) {
+      return;
+   }
+   int jobs_left = jcr->wstore->getNumConcurrentJobs() - 1;
+   Dmsg1(200, "Dec wncj=%d\n", jobs_left);
+   jcr->wstore->setNumConcurrentJobs(jobs_left);
+}