/*
 * Copyright (C) 1994-2021 Altair Engineering, Inc.
 * For more information, contact Altair at www.altair.com.
 *
 * This file is part of both the OpenPBS software ("OpenPBS")
 * and the PBS Professional ("PBS Pro") software.
 *
 * Open Source License Information:
 *
 * OpenPBS is free software. You can redistribute it and/or modify it under
 * the terms of the GNU Affero General Public License as published by the
 * Free Software Foundation, either version 3 of the License, or (at your
 * option) any later version.
 *
 * OpenPBS is distributed in the hope that it will be useful, but WITHOUT
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
 * FITNESS FOR A PARTICULAR PURPOSE.  See the GNU Affero General Public
 * License for more details.
 *
 * You should have received a copy of the GNU Affero General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 *
 * Commercial License Information:
 *
 * PBS Pro is commercially licensed software that shares a common core with
 * the OpenPBS software.  For a copy of the commercial license terms and
 * conditions, go to: (http://www.pbspro.com/agreement.html) or contact the
 * Altair Legal Department.
 *
 * Altair's dual-license business model allows companies, individuals, and
 * organizations to create proprietary derivative works of OpenPBS and
 * distribute them - whether embedded or bundled with other software -
 * under a commercial license agreement.
 *
 * Use of Altair's trademarks, including but not limited to "PBS™",
 * "OpenPBS®", "PBS Professional®", and "PBS Pro™" and Altair's logos is
 * subject to Altair's trademark licensing policies.
 */

/**
 * @file    node_info.c
 *
 * @brief
 * 		node_info.c - This file contains functions related to the node_info structure.
 *
 * Functions included are:
 * 	query_nodes()
 * 	query_node_info()
 * 	free_nodes()
 * 	set_node_info_state()
 * 	remove_node_state()
 * 	add_node_state()
 * 	node_filter()
 * 	find_node_info()
 * 	find_node_by_host()
 * 	dup_nodes()
 * 	dup_node_info()
 * 	copy_node_ptr_array()
 * 	collect_resvs_on_nodes()
 * 	collect_jobs_on_nodes()
 * 	update_node_on_run()
 * 	update_node_on_end()
 * 	check_rescspec()
 * 	search_for_rescspec()
 * 	dup_nspec()
 * 	free_nspecs()
 * 	find_nspec()
 * 	find_nspec_by_rank()
 * 	eval_selspec()
 * 	eval_placement()
 * 	eval_complex_selspec()
 * 	eval_simple_selspec()
 * 	is_vnode_eligible()
 * 	is_vnode_eligible_chunk()
 * 	resources_avail_on_vnode()
 * 	check_resources_for_node()
 * 	parse_placespec()
 * 	parse_selspec()
 * 	create_execvnode()
 * 	parse_execvnode()
 * 	node_state_to_str()
 * 	combine_nspec_array()
 * 	create_node_array_from_nspec()
 * 	reorder_nodes()
 * 	reorder_nodes_set()
 * 	ok_break_chunk()
 * 	is_excl()
 * 	alloc_rest_nodepart()
 * 	can_fit_on_vnode()
 * 	is_provisionable()
 * 	node_up_event()
 * 	node_down_event()
 * 	create_node_array_from_str()
 * 	find_node_by_rank()
 * 	new_node_scratch()
 * 	free_node_scratch()
 * 	sim_exclhost()
 * 	sim_exclhost_func()
 * 	set_current_aoe()
 * 	is_exclhost()
 * 	check_node_array_eligibility()
 * 	is_powerok()
 * 	is_eoe_avail_on_vnode()
 * 	set_current_eoe()
 *
 */

#include <unordered_map>

#include <pbs_config.h>

#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <math.h>
#include <ctype.h>
#include <sys/types.h>
#include <errno.h>
#include <math.h>
#include <errno.h>
#include <time.h>
#include <pbs_ifl.h>
#include <log.h>
#include <grunt.h>
#include <libutil.h>
#include <pbs_internal.h>
#include "attribute.h"
#include "node_info.h"
#include "server_info.h"
#include "job_info.h"
#include "misc.h"
#include "globals.h"
#include "check.h"
#include "constant.h"
#include "config.h"
#include "resource_resv.h"
#include "simulate.h"
#include "sort.h"
#include "node_partition.h"
#include "resource.h"
#include "pbs_internal.h"
#include "server_info.h"
#include "pbs_share.h"
#include "pbs_bitmap.h"
#include "pbs_license.h"
#include "multi_threading.h"
#ifdef NAS
#include "site_code.h"
#endif

/*
 * name of the last node a job ran on - used in smp_dist = round robin.
 * File-local buffer of PBS_MAXSVRJOBID bytes.
 */
static char last_node_name[PBS_MAXSVRJOBID];

/**
 * @brief	thread routine that converts one chunk of a batch_status node list
 *		into node_info objects
 *
 * @param[in,out]	data - describes the chunk: reads nodes, sinfo, sidx and eidx.
 *				On success data->oarr receives a newly allocated, NULL
 *				terminated node_info array holding only the nodes that
 *				node_in_partition() accepts.
 *				On failure data->error is set to 1 and data->oarr is NULL.
 *
 * @return void
 */
void
query_node_info_chunk(th_data_query_ninfo *data)
{
	struct batch_status *nodes;
	struct batch_status *cur_node;
	node_info **ninfo_arr;
	server_info *sinfo;
	node_info *ninfo;
	int i;
	int nidx;
	int start;
	int end;
	int num_nodes_chunk;

	nodes = data->nodes;
	sinfo = data->sinfo;
	start = data->sidx;
	end = data->eidx;
	num_nodes_chunk = end - start + 1;

	if ((ninfo_arr = static_cast<node_info **>(malloc((num_nodes_chunk + 1) * sizeof(node_info *)))) == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		data->oarr = NULL;
		data->error = 1;
		return;
	}
	ninfo_arr[0] = NULL;

	/* Move to the linked list item corresponding to the 'start' index */
	for (cur_node = nodes, i = 0; i < start && cur_node != NULL; cur_node = cur_node->next, i++)
		;

	for (i = start, nidx = 0; i <= end && cur_node != NULL; cur_node = cur_node->next, i++) {
		/* get node info from the batch_status */
		if ((ninfo = query_node_info(cur_node, sinfo)) == NULL) {
			/*
			 * free_nodes() walks the array until it finds NULL, so the
			 * array must be terminated before it is handed over.
			 */
			ninfo_arr[nidx] = NULL;
			free_nodes(ninfo_arr);
			data->oarr = NULL;
			data->error = 1;
			return;
		}

		if (node_in_partition(ninfo, sc_attrs.partition)) {
			ninfo_arr[nidx++] = ninfo;
		} else
			delete ninfo;
	}
	ninfo_arr[nidx] = NULL;

	data->oarr = ninfo_arr;
}

/**
 * @brief	Build the per-task work descriptor used by query_nodes
 *
 * @param[in]	nodes	-	batch_status list of nodes queried from the server
 * @param[in]	sinfo	-	server information
 * @param[in]	sidx	-	index of the first node in the list the task handles
 * @param[in]	eidx	-	index of the last node in the list the task handles
 *
 * @return th_data_query_ninfo *
 * @retval newly malloc'ed descriptor with error cleared and oarr set to NULL
 * @retval NULL if the allocation failed (the error is logged)
 */
static inline th_data_query_ninfo *
alloc_tdata_nd_query(struct batch_status *nodes, server_info *sinfo, int sidx, int eidx)
{
	auto *work = static_cast<th_data_query_ninfo *>(malloc(sizeof(th_data_query_ninfo)));

	if (work != NULL) {
		work->nodes = nodes;
		work->sinfo = sinfo;
		work->sidx = sidx;
		work->eidx = eidx;
		work->oarr = NULL; /* output slot, written by the chunk routine */
		work->error = 0;
		return work;
	}

	log_err(errno, __func__, MEM_ERR_MSG);
	return NULL;
}

/**
 * @brief
 *      query_nodes - query all the nodes associated with a server
 *
 * @par
 *	The node list is fetched with send_statvnode() and converted into
 *	node_info objects by query_node_info_chunk().  The conversion runs
 *	inline when called from a worker thread or when num_threads <= 1;
 *	otherwise it is split into chunks that are queued for the worker threads.
 *
 * @param[in]	pbs_sd	-	communication descriptor with the pbs server
 * @param[in,out]	sinfo	-	server information; num_nodes is set on success
 *
 * @return	NULL terminated array of nodes associated with server
 * @retval	NULL	: on error, or if no node is in a partition serviced
 *			  by this scheduler
 *
 */
node_info **
query_nodes(int pbs_sd, server_info *sinfo)
{
	struct batch_status *nodes;    /* nodes returned from the server */
	struct batch_status *cur_node; /* used to cycle through nodes */
	node_info **ninfo_arr;	       /* array of nodes for scheduler's use */
	int num_nodes = 0;	       /* the number of nodes */
	int nidx = 0;
	static struct attrl *attrib = NULL;
	th_data_query_ninfo *tdata = NULL;
	th_task_info *task = NULL;
	node_info ***ninfo_arrs_tasks = NULL;
	int tid;

	/* The attribute list is built once and reused on every later call */
	if (attrib == NULL) {
		const char *nodeattrs[] = {
			ATTR_NODE_state,
			ATTR_NODE_Mom,
			ATTR_NODE_Port,
			ATTR_partition,
			ATTR_NODE_jobs,
			ATTR_NODE_ntype,
			ATTR_maxrun,
			ATTR_maxuserrun,
			ATTR_maxgrprun,
			ATTR_queue,
			ATTR_p,
			ATTR_NODE_Sharing,
			ATTR_NODE_License,
			ATTR_rescavail,
			ATTR_rescassn,
			ATTR_NODE_NoMultiNode,
			ATTR_ResvEnable,
			ATTR_NODE_ProvisionEnable,
			ATTR_NODE_current_aoe,
			ATTR_NODE_power_provisioning,
			ATTR_NODE_current_eoe,
			ATTR_NODE_in_multivnode_host,
			ATTR_NODE_last_state_change_time,
			ATTR_NODE_last_used_time,
			ATTR_NODE_resvs,
			NULL};

		/* NOTE(review): new_attrl() and strdup() results are used unchecked here */
		for (int i = 0; nodeattrs[i] != NULL; i++) {
			struct attrl *temp_attrl;

			temp_attrl = new_attrl();
			temp_attrl->name = strdup(nodeattrs[i]);
			temp_attrl->next = attrib;
			temp_attrl->value = const_cast<char *>("");
			attrib = temp_attrl;
		}
	}

	/* get nodes from PBS server */
	if ((nodes = send_statvnode(pbs_sd, NULL, attrib, NULL)) == NULL) {
		auto err = pbs_geterrmsg(pbs_sd);
		log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO, "", "Error getting nodes: %s", err);
		return NULL;
	}

	cur_node = nodes;
	while (cur_node != NULL) {
		num_nodes++;
		cur_node = cur_node->next;
	}

	tid = *((int *) pthread_getspecific(th_id_key));
	if (tid != 0 || num_threads <= 1) {
		int chunk_err;

		/* don't use multi-threading if I am a worker thread or num_threads is 1 */
		tdata = alloc_tdata_nd_query(nodes, sinfo, 0, num_nodes - 1);
		if (tdata == NULL) {
			pbs_statfree(nodes);
			return NULL;
		}
		query_node_info_chunk(tdata);
		ninfo_arr = tdata->oarr;
		chunk_err = tdata->error;
		free(tdata);

		/* On failure the chunk routine leaves oarr NULL; do not touch it */
		if (chunk_err || ninfo_arr == NULL) {
			pbs_statfree(nodes);
			return NULL;
		}

		for (nidx = 0; ninfo_arr[nidx] != NULL; nidx++)
			ninfo_arr[nidx]->rank = get_sched_rank();
	} else {
		int chunk_size = num_nodes / num_threads;
		int th_err = 0;
		int num_tasks = 0;
		int max_tasks;

		chunk_size = (chunk_size > MT_CHUNK_SIZE_MIN) ? chunk_size : MT_CHUNK_SIZE_MIN;
		max_tasks = (num_nodes + chunk_size - 1) / chunk_size;

		if ((ninfo_arr = static_cast<node_info **>(malloc((num_nodes + 1) * sizeof(node_info *)))) == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			pbs_statfree(nodes);
			return NULL;
		}
		ninfo_arr[0] = NULL;

		/*
		 * Allocate the per-task result table before any work is queued so
		 * that results always have somewhere to go.  calloc() leaves every
		 * slot NULL; at least one slot is requested so that an empty node
		 * list is not mistaken for an allocation failure.
		 */
		ninfo_arrs_tasks = static_cast<node_info ***>(calloc(max_tasks > 0 ? max_tasks : 1, sizeof(node_info **)));
		if (ninfo_arrs_tasks == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			free(ninfo_arr);
			pbs_statfree(nodes);
			return NULL;
		}

		for (int j = 0; j < num_nodes; j += chunk_size, num_tasks++) {
			tdata = alloc_tdata_nd_query(nodes, sinfo, j, j + chunk_size - 1);
			if (tdata == NULL) {
				th_err = 1;
				break;
			}
			task = static_cast<th_task_info *>(malloc(sizeof(th_task_info)));
			if (task == NULL) {
				free(tdata);
				log_err(errno, __func__, MEM_ERR_MSG);
				th_err = 1;
				break;
			}
			task->task_id = num_tasks;
			task->task_type = TS_QUERY_ND_INFO;
			task->thread_data = (void *) tdata;

			queue_work_for_threads(task);
		}

		/* Get results from worker threads; every queued task must be collected */
		for (int i = 0; i < num_tasks;) {
			pthread_mutex_lock(&result_lock);
			while (ds_queue_is_empty(result_queue))
				pthread_cond_wait(&result_cond, &result_lock);
			while (!ds_queue_is_empty(result_queue)) {
				task = static_cast<th_task_info *>(ds_dequeue(result_queue));
				tdata = static_cast<th_data_query_ninfo *>(task->thread_data);
				if (tdata->error)
					th_err = 1;
				ninfo_arrs_tasks[task->task_id] = tdata->oarr;
				free(tdata);
				free(task);
				i++;
			}
			pthread_mutex_unlock(&result_lock);
		}
		if (th_err) {
			/* release the chunks that did succeed; free_nodes() ignores NULL */
			for (int i = 0; i < num_tasks; i++)
				free_nodes(ninfo_arrs_tasks[i]);
			free(ninfo_arrs_tasks);
			free(ninfo_arr); /* still empty, nothing to delete */
			pbs_statfree(nodes);
			return NULL;
		}
		/* Assemble node info objects from various threads into the ninfo_arr */
		for (int i = 0; i < num_tasks; i++) {
			if (ninfo_arrs_tasks[i] != NULL) {
				node_info *ninfo;

				for (int j = 0; (ninfo = ninfo_arrs_tasks[i][j]) != NULL; j++) {
					ninfo->rank = get_sched_rank();
					ninfo_arr[nidx++] = ninfo;
				}
				free(ninfo_arrs_tasks[i]);
			}
		}
		ninfo_arr[nidx] = NULL;
		free(ninfo_arrs_tasks);
	}

	if (nidx == 0) {
		log_event(PBSEVENT_SCHED, PBS_EVENTCLASS_SERVER, LOG_INFO, __func__,
			  "No nodes found in partitions serviced by scheduler");
		pbs_statfree(nodes);
		free(ninfo_arr);
		return NULL;
	}

#ifdef NAS /* localmod 062 */
	site_vnode_inherit(ninfo_arr);
#endif /* localmod 062 */
	resolve_indirect_resources(ninfo_arr);
	sinfo->num_nodes = nidx;
	pbs_statfree(nodes);
	return ninfo_arr;
}

/**
 * @brief
 *      query_node_info	- collect information from a batch_status and
 *      put it in a node_info struct for easier access
 *
 * @param[in]	node	-	a node returned from a pbs_statvnode() call
 * @param[in,out]	sinfo	-	server information; has_multi_vnode is set
 *					when the node reports being on a multi-vnode host
 *
 * @return	a node_info filled with information from node
 * @retval	NULL	: on error (string duplication or set_resource() failure)
 *
 */
node_info *
query_node_info(struct batch_status *node, server_info *sinfo)
{
	node_info *ninfo;     /* the new node_info */
	struct attrl *attrp;  /* used to cycle though attribute list */
	schd_resource *res;   /* used to set resources in res list */
	sch_resource_t count; /* used to convert str->num */
	char *endp;	      /* end pointer for strtol */
	int check_expiry = 0;
	time_t expiry = 0;

	if ((ninfo = new node_info(node->name)) == NULL)
		return NULL;

	attrp = node->attribs;

	ninfo->server = sinfo;

	while (attrp != NULL) {
		/* Node State... i.e. offline down free etc */
		if (!strcmp(attrp->name, ATTR_NODE_state))
			set_node_info_state(ninfo, attrp->value);

		/* Host name */
		else if (!strcmp(attrp->name, ATTR_NODE_Mom)) {
			if (ninfo->mom)
				free(ninfo->mom);
			if ((ninfo->mom = string_dup(attrp->value)) == NULL) {
				delete ninfo;
				return NULL;
			}
		} else if (!strcmp(attrp->name, ATTR_partition)) {
			ninfo->partition = string_dup(attrp->value);
			if (ninfo->partition == NULL) {
				log_err(errno, __func__, MEM_ERR_MSG);
				delete ninfo;
				return NULL;
			}
		} else if (!strcmp(attrp->name, ATTR_NODE_jobs))
			ninfo->jobs = break_comma_list(attrp->value);
		else if (!strcmp(attrp->name, ATTR_maxrun)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->max_running = count;
		} else if (!strcmp(attrp->name, ATTR_maxuserrun)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->max_user_run = count;
			ninfo->has_hard_limit = 1;
		} else if (!strcmp(attrp->name, ATTR_maxgrprun)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->max_group_run = count;
			ninfo->has_hard_limit = 1;
		} else if (!strcmp(attrp->name, ATTR_queue))
			ninfo->queue_name = attrp->value;
		else if (!strcmp(attrp->name, ATTR_p)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->priority = count;
		} else if (!strcmp(attrp->name, ATTR_NODE_Sharing)) {
			ninfo->sharing = str_to_vnode_sharing(attrp->value);
			if (ninfo->sharing == VNS_UNSET) {
				log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO, ninfo->name,
					   "Unknown sharing type: %s using default shared", attrp->value);
				ninfo->sharing = VNS_DFLT_SHARED;
			}
		} else if (!strcmp(attrp->name, ATTR_NODE_License)) {
			switch (attrp->value[0]) {
				case ND_LIC_TYPE_locked:
					ninfo->lic_lock = 1;
					break;
				case ND_LIC_TYPE_cloud:
					/* decided after the loop, once the signature value is known */
					check_expiry = 1;
					break;
				default:
					log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO,
						   ninfo->name, "Unknown license type: %c", attrp->value[0]);
			}
		} else if (!strcmp(attrp->name, ATTR_rescavail)) {
			if (!strcmp(attrp->resource, ND_RESC_LicSignature)) {
				expiry = strtol(attrp->value, &endp, 10);
			}
			res = find_alloc_resource_by_str(ninfo->res, attrp->resource);

			if (res != NULL) {
				if (ninfo->res == NULL)
					ninfo->res = res;

				if (set_resource(res, attrp->value, RF_AVAIL) == 0) {
					/*
					 * Return right away: falling out of the loop would
					 * dereference the deleted node below.
					 */
					delete ninfo;
					return NULL;
				}

				/* Round memory off to the nearest megabyte */
				if (res->def == allres["mem"])
					res->avail -= (long) res->avail % 1024;
#ifdef NAS /* localmod 034 */
				site_set_node_share(ninfo, res);
#endif /* localmod 034 */
			}
		} else if (!strcmp(attrp->name, ATTR_rescassn)) {
			res = find_alloc_resource_by_str(ninfo->res, attrp->resource);

			if (ninfo->res == NULL)
				ninfo->res = res;
			if (res != NULL) {
				if (set_resource(res, attrp->value, RF_ASSN) == 0) {
					/* same as above: never continue with a deleted node */
					delete ninfo;
					return NULL;
				}
			}
		} else if (!strcmp(attrp->name, ATTR_NODE_NoMultiNode)) {
			if (!strcmp(attrp->value, ATR_TRUE))
				ninfo->no_multinode_jobs = 1;
		} else if (!strcmp(attrp->name, ATTR_ResvEnable)) {
			if (!strcmp(attrp->value, ATR_TRUE))
				ninfo->resv_enable = 1;
		} else if (!strcmp(attrp->name, ATTR_NODE_ProvisionEnable)) {
			if (!strcmp(attrp->value, ATR_TRUE))
				ninfo->provision_enable = 1;
		} else if (!strcmp(attrp->name, ATTR_NODE_current_aoe)) {
			if (attrp->value != NULL)
				set_current_aoe(ninfo, attrp->value);
		} else if (!strcmp(attrp->name, ATTR_NODE_power_provisioning)) {
			if (!strcmp(attrp->value, ATR_TRUE))
				ninfo->power_provisioning = 1;
		} else if (!strcmp(attrp->name, ATTR_NODE_current_eoe)) {
			if (attrp->value != NULL)
				set_current_eoe(ninfo, attrp->value);
		} else if (!strcmp(attrp->name, ATTR_NODE_in_multivnode_host)) {
			if (attrp->value != NULL) {
				count = strtol(attrp->value, &endp, 10);
				if (*endp == '\0')
					ninfo->is_multivnoded = count;
				if ((!sinfo->has_multi_vnode) && (count != 0))
					sinfo->has_multi_vnode = 1;
			}
		} else if (!strcmp(attrp->name, ATTR_NODE_last_state_change_time)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->last_state_change_time = count;
		} else if (!strcmp(attrp->name, ATTR_NODE_last_used_time)) {
			count = strtol(attrp->value, &endp, 10);
			if (*endp == '\0')
				ninfo->last_used_time = count;
		} else if (!strcmp(attrp->name, ATTR_NODE_resvs)) {
			ninfo->resvs = break_comma_list(attrp->value);
		}
		attrp = attrp->next;
	}

	/* a cloud license counts as locked only while its expiry lies in the future */
	if (check_expiry) {
		if (time(NULL) < expiry)
			ninfo->lic_lock = 1;
	}

	/* nodes without a locked license are marked ineligible for this cycle */
	if (ninfo->lic_lock != 1)
		ninfo->nscr |= NSCR_CYCLE_INELIGIBLE;

	return ninfo;
}

/**
 * @brief
 *	node_info constructor - gives every member a defined starting value
 *
 * @param[in]	nname	-	name of the node, copied into the name member
 */
node_info::node_info(const std::string &nname) : name(nname)
{
	/* node state bits: nothing is set on a new node */
	is_down = is_free = is_offline = is_unknown = 0;
	is_exclusive = is_job_exclusive = is_resv_exclusive = 0;
	is_sharing = is_busy = is_job_busy = 0;
	is_stale = is_maintenance = is_provisioning = is_sleeping = 0;
	is_multivnoded = has_ghost_job = 0;

	/* license state and feature switches start cleared */
	lic_lock = 0;
	has_hard_limit = no_multinode_jobs = 0;
	resv_enable = provision_enable = power_provisioning = 0;

	sharing = VNS_DFLT_SHARED;

	/* counters and ordering values */
	num_jobs = num_run_resv = num_susp_jobs = 0;
	priority = 0;
	rank = 0;
	last_state_change_time = last_used_time = 0;

	/* run limits start out as SCHD_INFINITY */
	max_running = SCHD_INFINITY;
	max_user_run = SCHD_INFINITY;
	max_group_run = SCHD_INFINITY;

	/* indices use -1 as their initial value */
	nodesig_ind = -1;
	bucket_ind = -1;
	node_ind = -1;

	nscr = NSCR_NONE;

	/* pointer members released in the destructor */
	mom = NULL;
	jobs = NULL;
	resvs = NULL;
	job_arr = NULL;
	run_resvs_arr = NULL;
	res = NULL;
	current_aoe = NULL;
	current_eoe = NULL;
	nodesig = NULL;
	node_events = NULL;
	partition = NULL;
	np_arr = NULL;

	/* pointer members the destructor leaves alone */
	server = NULL;
	svr_node = NULL;
	hostset = NULL;

#ifdef NAS
	/* localmod 034 */
	sh_type = 0;
	sh_cls = 0;
#endif
}

/**
 * @brief	pthread routine that deletes one slice of a node_info array
 *
 * @par
 *	Deletes the entries from data->sidx through data->eidx, stopping early
 *	at the first NULL entry.  The array itself is not freed here.
 *
 * @param[in,out]	data - th_data_free_ninfo wrapper for the ninfo array
 *
 * @return void
 */
void
free_node_info_chunk(th_data_free_ninfo *data)
{
	node_info **nodes = data->ninfo_arr;
	const int last = data->eidx;
	int idx = data->sidx;

	while (idx <= last && nodes[idx] != NULL) {
		delete nodes[idx];
		idx++;
	}
}

/**
 * @brief	Build the per-task work descriptor used by free_nodes
 *
 * @param[in,out]	ninfo_arr	-	the node array to free
 * @param[in]	sidx	-	index of the first array entry the task handles
 * @param[in]	eidx	-	index of the last array entry the task handles
 *
 * @return th_data_free_ninfo *
 * @retval newly malloc'ed descriptor
 * @retval NULL if the allocation failed (the error is logged)
 */
static inline th_data_free_ninfo *
alloc_tdata_free_nodes(node_info **ninfo_arr, int sidx, int eidx)
{
	auto *work = static_cast<th_data_free_ninfo *>(malloc(sizeof(th_data_free_ninfo)));

	if (work != NULL) {
		work->ninfo_arr = ninfo_arr;
		work->sidx = sidx;
		work->eidx = eidx;
		return work;
	}

	log_err(errno, __func__, MEM_ERR_MSG);
	return NULL;
}

/**
 * @brief
 *		free_nodes - free all the nodes in a node_info array
 *
 * @par
 *	When called from the main thread with more than one thread configured,
 *	the array is split into chunks that are queued for the worker threads.
 *	Any node that could not be queued (for example because a task
 *	allocation failed), and every node in the single-threaded case, is
 *	deleted directly by the caller so that nothing is leaked.
 *
 * @param[in,out]	ninfo_arr - the NULL terminated node info array; both
 *				    the nodes and the array itself are released
 *
 * @return	nothing
 *
 */
void
free_nodes(node_info **ninfo_arr)
{
	th_data_free_ninfo *tdata = NULL;
	th_task_info *task = NULL;
	int num_tasks = 0;
	int num_nodes;
	int next_idx = 0; /* first index not yet handed to a worker thread */
	int tid;

	if (ninfo_arr == NULL)
		return;

	num_nodes = count_array(ninfo_arr);

	tid = *((int *) pthread_getspecific(th_id_key));
	/* don't use multi-threading if I am a worker thread or num_threads is 1 */
	if (tid == 0 && num_threads > 1) {
		int chunk_size = num_nodes / num_threads;

		chunk_size = (chunk_size > MT_CHUNK_SIZE_MIN) ? chunk_size : MT_CHUNK_SIZE_MIN;
		for (; next_idx < num_nodes; next_idx += chunk_size, num_tasks++) {
			tdata = alloc_tdata_free_nodes(ninfo_arr, next_idx, next_idx + chunk_size - 1);
			if (tdata == NULL)
				break;

			task = static_cast<th_task_info *>(malloc(sizeof(th_task_info)));
			if (task == NULL) {
				free(tdata);
				log_err(errno, __func__, MEM_ERR_MSG);
				break;
			}
			task->task_id = num_tasks;
			task->task_type = TS_FREE_ND_INFO;
			task->thread_data = (void *) tdata;

			queue_work_for_threads(task);
		}

		/* Get results from worker threads */
		for (int i = 0; i < num_tasks;) {
			pthread_mutex_lock(&result_lock);
			while (ds_queue_is_empty(result_queue))
				pthread_cond_wait(&result_cond, &result_lock);
			while (!ds_queue_is_empty(result_queue)) {
				task = static_cast<th_task_info *>(ds_dequeue(result_queue));
				tdata = static_cast<th_data_free_ninfo *>(task->thread_data);
				free(tdata);
				free(task);
				i++;
			}
			pthread_mutex_unlock(&result_lock);
		}
	}

	/*
	 * Delete whatever was not queued: everything in the single-threaded
	 * case, or the tail left over after an allocation failure above.
	 */
	for (; next_idx < num_nodes; next_idx++)
		delete ninfo_arr[next_idx];

	free(ninfo_arr);
}

/**
 * @brief
 *      node_info destructor - releases everything the node allocated
 */
node_info::~node_info()
{
	/* members that have a dedicated release helper */
	free_string_array(jobs);
	free_string_array(resvs);
	free_resource_list(res);
	free_counts_list(group_counts);
	free_counts_list(user_counts);
	free_te_list(node_events);

	/* members released with a plain free(); free(NULL) is a no-op */
	void *heap_blocks[] = {mom, job_arr, run_resvs_arr, current_aoe,
			       current_eoe, nodesig, partition, np_arr};
	for (void *blk : heap_blocks)
		free(blk);
}

/**
 * @brief
 * 		set the node state info bits from a single or comma separated list of
 * 		states.
 *
 * @par
 *	The state string is copied to a heap buffer sized to fit, so a string
 *	of any length is handled.  Each token has leading white space skipped
 *	and is then passed to add_node_state(); unknown states are logged and
 *	skipped.
 *
 * @param[in]	ninfo	-	the node to set the state
 * @param[in]	state	-	the state string from the server
 *
 * @retval	0	: on success
 * @retval	1	: on failure (NULL argument or out of memory; the node's
 *			  state bits are left untouched in that case)
 */
int
set_node_info_state(node_info *ninfo, const char *state)
{
	char *statebuf; /* private copy of state, strtok_r() modifies its input */
	char *tok;	/* used with strtok_r() */
	char *saveptr;

	if (ninfo == NULL || state == NULL)
		return 1;

	/* copy first so that a failed allocation leaves the node unchanged */
	if ((statebuf = strdup(state)) == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return 1;
	}

	/*
	 * clear all states
	 * NOTE(review): is_offline is not cleared here - confirm this is intended
	 */
	ninfo->is_down = ninfo->is_free = ninfo->is_unknown = 0;
	ninfo->is_sharing = ninfo->is_busy = ninfo->is_job_busy = 0;
	ninfo->is_stale = ninfo->is_provisioning = ninfo->is_exclusive = 0;
	ninfo->is_resv_exclusive = ninfo->is_job_exclusive = 0;
	ninfo->is_sleeping = ninfo->is_maintenance = 0;

	for (tok = strtok_r(statebuf, ",", &saveptr); tok != NULL; tok = strtok_r(NULL, ",", &saveptr)) {
		/* the cast keeps isspace() defined for chars with the high bit set */
		while (isspace((unsigned char) *tok))
			tok++;

		if (add_node_state(ninfo, tok) == 1)
			log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO,
				   ninfo->name, "Unknown Node State: %s", tok);
	}

	free(statebuf);
	return 0;
}

/**
 * @brief
 * 		Remove a node state
 *
 * @param[in]	ninfo	-	The node being considered
 * @param[in]	state	-	The state to remove
 *
 * @par Side-Effects:
 * 		Handles node exclusivity in a special way.
 * 		If handling resv-exclusive, unset is_exclusive only if job-exclusive
 * 		isn't set.
 * 		If handling job-exclusive, unset is_exclusive only if resv-exclusive isn't
 * 		set.
 * 		If no state bit is left set afterwards the node is marked free.
 * 		NSCR_CYCLE_INELIGIBLE is cleared from nscr when the node is free and
 * 		set otherwise.
 *
 * @retval	0	: on success
 * @retval	1	: on failure (NULL argument or unknown state)
 */
int
remove_node_state(node_info *ninfo, const char *state)
{
	/* a NULL state would otherwise be passed straight to strcmp() */
	if (ninfo == NULL || state == NULL)
		return 1;

	if (!strcmp(state, ND_down))
		ninfo->is_down = 0;
	else if (!strcmp(state, ND_free))
		ninfo->is_free = 0;
	else if (!strcmp(state, ND_offline))
		ninfo->is_offline = 0;
	else if (!strcmp(state, ND_state_unknown))
		ninfo->is_unknown = 0;
	else if (!strcmp(state, ND_job_exclusive)) {
		ninfo->is_job_exclusive = 0;
		if (ninfo->is_resv_exclusive == 0)
			ninfo->is_exclusive = 0;
	} else if (!strcmp(state, ND_resv_exclusive)) {
		ninfo->is_resv_exclusive = 0;
		if (ninfo->is_job_exclusive == 0)
			ninfo->is_exclusive = 0;
	} else if (!strcmp(state, ND_job_sharing))
		ninfo->is_sharing = 0;
	else if (!strcmp(state, ND_busy))
		ninfo->is_busy = 0;
	else if (!strcmp(state, ND_jobbusy))
		ninfo->is_job_busy = 0;
	else if (!strcmp(state, ND_Stale))
		ninfo->is_stale = 0;
	else if (!strcmp(state, ND_prov))
		ninfo->is_provisioning = 0;
	else if (!strcmp(state, ND_wait_prov))
		ninfo->is_provisioning = 0;
	else if (!strcmp(state, ND_maintenance))
		ninfo->is_maintenance = 0;
	else {
		log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO,
			   ninfo->name, "Unknown Node State: %s on remove operation", state);
		return 1;
	}

	/* If all state bits are turned off, the node state must be free */
	if (!ninfo->is_free && !ninfo->is_busy && !ninfo->is_exclusive && !ninfo->is_job_exclusive && !ninfo->is_resv_exclusive && !ninfo->is_offline && !ninfo->is_job_busy && !ninfo->is_stale && !ninfo->is_provisioning && !ninfo->is_sharing && !ninfo->is_unknown && !ninfo->is_down && !ninfo->is_maintenance)
		ninfo->is_free = 1;

	if (ninfo->is_free)
		ninfo->nscr &= ~NSCR_CYCLE_INELIGIBLE;
	else
		ninfo->nscr |= NSCR_CYCLE_INELIGIBLE;

	return 0;
}

/**
 * @brief
 * 		Add a node state
 *
 * @param[in]	ninfo	-	The node being considered
 * @param[in]	state	-	The state to add
 *
 * @par Side-Effects:
 * 		Handle node exclusivity in a special way.
 * 		If handling resv-exclusive or job-exclusive, turn is_exclusive bit on.
 * 		Adding any state other than free clears is_free and sets
 * 		NSCR_CYCLE_INELIGIBLE in nscr; adding free clears that flag.
 * 		The sleep state is only recorded when the node's server has
 * 		power_provisioning set.
 *
 * @retval	0	: on success
 * @retval	1	: on failure (NULL argument or unknown state)
 */
int
add_node_state(node_info *ninfo, const char *state)
{
	int set_free = 0;

	/* a NULL state would otherwise be passed straight to strcmp() */
	if (ninfo == NULL || state == NULL)
		return 1;

	if (!strcmp(state, ND_down))
		ninfo->is_down = 1;
	else if (!strcmp(state, ND_free)) {
		ninfo->is_free = 1;
		set_free = 1;
	} else if (!strcmp(state, ND_offline))
		ninfo->is_offline = 1;
	else if (!strcmp(state, ND_state_unknown) || !strcmp(state, ND_unresolvable))
		ninfo->is_unknown = 1;
	else if (!strcmp(state, ND_job_exclusive)) {
		ninfo->is_job_exclusive = 1;
		ninfo->is_exclusive = 1;
	} else if (!strcmp(state, ND_resv_exclusive)) {
		ninfo->is_resv_exclusive = 1;
		ninfo->is_exclusive = 1;
	} else if (!strcmp(state, ND_job_sharing))
		ninfo->is_sharing = 1;
	else if (!strcmp(state, ND_busy))
		ninfo->is_busy = 1;
	else if (!strcmp(state, ND_jobbusy))
		ninfo->is_job_busy = 1;
	else if (!strcmp(state, ND_Stale))
		ninfo->is_stale = 1;
	else if (!strcmp(state, ND_prov))
		ninfo->is_provisioning = 1;
	else if (!strcmp(state, ND_wait_prov))
		ninfo->is_provisioning = 1;
	else if (!strcmp(state, ND_maintenance))
		ninfo->is_maintenance = 1;
	else if (!strcmp(state, ND_sleep)) {
		/* server is NULL on a freshly constructed node, so check it first */
		if (ninfo->server != NULL && ninfo->server->power_provisioning)
			ninfo->is_sleeping = 1;
	} else {
		log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_INFO,
			   ninfo->name, "Unknown Node State: %s on add operation", state);
		return 1;
	}

	/* Remove the free state unless it was specifically the state being added */
	if (!set_free) {
		ninfo->is_free = 0;
		ninfo->nscr |= NSCR_CYCLE_INELIGIBLE;
	} else
		ninfo->nscr &= ~NSCR_CYCLE_INELIGIBLE;

	return 0;
}

/**
 * @brief
 *		node_filter - build a new array holding the nodes accepted by a
 *			      filter function
 *
 * @param[in]	nodes	-	the array to filter
 * @param[in]	size	-	size of nodes (<0 for function to figure it out)
 * @param[in]	filter_func	-	pointer to a function that will filter the nodes
 *								- returns non-zero: node will be added to filtered array
 *								- returns 0: node will NOT be added to filtered array
 * @param[in]	arg - an optional arg passed to filter_func
 * @param[in]	flags - describe how nodes are filtered; with FILTER_FULL the
 *			returned array keeps its full (size + 1) allocation,
 *			otherwise it is shrunk to fit the accepted nodes
 *
 * @return pointer to NULL terminated filtered array; the node_info objects
 *	   are shared with the input array, not copied
 * @retval NULL	: on memory allocation error
 *
 * @par
 * filter_func prototype: int func( node_info *, void * )
 *
 */
node_info **
node_filter(node_info **nodes, int size,
	    int (*filter_func)(node_info *, void *), void *arg, int flags)
{
	node_info **kept;
	node_info **shrunk;
	int nkept = 0;

	if (size < 0)
		size = count_array(nodes);

	kept = static_cast<node_info **>(malloc((size + 1) * sizeof(node_info *)));
	if (kept == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return NULL;
	}

	for (int idx = 0; idx < size; idx++) {
		if (filter_func(nodes[idx], arg))
			kept[nkept++] = nodes[idx];
	}
	kept[nkept] = NULL;

	if (flags & FILTER_FULL)
		return kept;

	/* give back the unused tail; on failure the larger array is still valid */
	shrunk = static_cast<node_info **>(realloc(kept, (nkept + 1) * sizeof(node_info *)));
	if (shrunk == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return kept;
	}

	return shrunk;
}

/**
 * @brief find a node by its name
 * @param[in] ninfo_arr - NULL terminated node array to search
 * @param[in] nodename - name of node to search for
 * @return node_info *
 * @retval first node whose name equals nodename
 * @retval NULL if not found or if ninfo_arr is NULL
 */
node_info *
find_node_info(node_info **ninfo_arr, const std::string &nodename)
{
	if (ninfo_arr == NULL)
		return NULL;

	for (node_info **cur = ninfo_arr; *cur != NULL; cur++) {
		if (nodename == (*cur)->name)
			return *cur;
	}

	return NULL;
}

/**
 * @brief
 *		find_node_by_host - find a node by its host resource rather than
 *				its name -- will return first found vnode
 *
 * @par
 *	Nodes without a "host" resource are skipped.  The comparison is done
 *	by compare_res_to_str() with CMP_CASELESS.
 *
 * @param[in]	ninfo_arr	-	NULL terminated array of nodes to search
 * @param[in]	host	-	host of node to find
 *
 * @return	found node
 * @retval	NULL	: not found, or ninfo_arr or host is NULL
 *
 */
node_info *
find_node_by_host(node_info **ninfo_arr, char *host)
{
	if (ninfo_arr == NULL || host == NULL)
		return NULL;

	for (node_info **cur = ninfo_arr; *cur != NULL; cur++) {
		auto host_res = find_resource((*cur)->res, allres["host"]);

		if (host_res != NULL && compare_res_to_str(host_res, host, CMP_CASELESS))
			return *cur;
	}

	return NULL;
}

/**
 * @brief	pthread routine to dup a chunk of nodes
 *
 * @par
 *	Duplicates data->onodes[sidx..eidx] into the same positions of
 *	data->nnodes, stopping early at the first NULL source entry.
 *	data->error is reset to 0 on entry and set to 1 if dup_node_info()
 *	fails, in which case the remaining entries are not processed.
 *
 * @param[in,out]	data - data associated with duping of the nodes
 *
 * @return void
 */
void
dup_node_info_chunk(th_data_dup_nd_info *data)
{
	node_info **src = data->onodes;
	node_info **dst = data->nnodes;
	server_info *new_server = data->nsinfo;
	const unsigned int dup_flags = data->flags;
	const int last = data->eidx;

	data->error = 0;

	for (int idx = data->sidx; idx <= last && src[idx] != NULL; idx++) {
		dst[idx] = dup_node_info(src[idx], new_server, dup_flags);
		if (dst[idx] == NULL) {
			data->error = 1;
			break;
		}
	}
}

/**
 * @brief	Build the per-task work descriptor used by dup_nodes
 *
 * @param[in]	flags	-	flags passed to dup_nodes
 * @param[in]	nsinfo	-	the new server
 * @param[in]	onodes	-	the array to duplicate
 * @param[out]	nnodes	-	the duplicated array
 * @param[in]	sidx	-	index of the first node the task handles
 * @param[in]	eidx	-	index of the last node the task handles
 *
 * @return th_data_dup_nd_info *
 * @retval newly malloc'ed descriptor (its error member is not set here)
 * @retval NULL if the allocation failed (the error is logged)
 */
static inline th_data_dup_nd_info *
alloc_tdata_dup_nodes(unsigned int flags, server_info *nsinfo, node_info **onodes, node_info **nnodes,
		      int sidx, int eidx)
{
	auto *work = static_cast<th_data_dup_nd_info *>(malloc(sizeof(th_data_dup_nd_info)));

	if (work != NULL) {
		work->onodes = onodes;
		work->nnodes = nnodes;
		work->nsinfo = nsinfo;
		work->flags = flags;
		work->sidx = sidx;
		work->eidx = eidx;
		return work;
	}

	log_err(errno, __func__, MEM_ERR_MSG);
	return NULL;
}

/**
 * @brief
 *		dup_nodes - duplicate an array of nodes
 *
 * The nodes are duplicated either inline (when called from a worker thread or
 * when only one thread is configured) or by queueing chunks of the array to
 * the worker threads and waiting for all of them to report back.
 *
 * @param[in]	onodes	-	the NULL terminated array to duplicate
 * @param[in]	nsinfo	-	the new server
 * @param[in]	flags	-	DUP_INDIRECT - duplicate
 * 				 			target resources, not indirect
 *
 * @return the duplicated array (NULL terminated, owned by the caller)
 * @retval	NULL	: on error, or if onodes/nsinfo is NULL
 *
 */
node_info **
dup_nodes(node_info **onodes, server_info *nsinfo, unsigned int flags)
{
	node_info **nnodes;
	int num_nodes;
	int thread_node_ct_left;
	schd_resource *nres = NULL;
	schd_resource *ores = NULL;
	schd_resource *tres = NULL;
	node_info *ninfo = NULL;
	th_data_dup_nd_info *tdata = NULL;
	th_task_info *task = NULL;
	int th_err = 0;
	int tid;

	if (onodes == NULL || nsinfo == NULL)
		return NULL;

	num_nodes = thread_node_ct_left = count_array(onodes);

	/* calloc() so that every slot starts out NULL: the error paths below pass
	 * a partially filled (or completely unfilled) array to free_nodes(), so it
	 * must never contain uninitialized pointers.
	 */
	if ((nnodes = static_cast<node_info **>(calloc(num_nodes + 1, sizeof(node_info *)))) == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return NULL;
	}

	tid = *((int *) pthread_getspecific(th_id_key));
	if (tid != 0 || num_threads <= 1) {
		/* don't use multi-threading if I am a worker thread or num_threads is 1 */
		tdata = alloc_tdata_dup_nodes(flags, nsinfo, onodes, nnodes, 0, num_nodes - 1);
		if (tdata == NULL) {
			/* alloc_tdata_dup_nodes() has already logged the failure */
			free_nodes(nnodes);
			return NULL;
		}

		dup_node_info_chunk(tdata);
		th_err = tdata->error;
		free(tdata);
	} else { /* We are multithreading */
		int j;
		int num_tasks;
		int chunk_size = num_nodes / num_threads;
		chunk_size = (chunk_size > MT_CHUNK_SIZE_MIN) ? chunk_size : MT_CHUNK_SIZE_MIN;
		/* The last chunk's end index may run past the array; the worker stops
		 * at the NULL terminator of onodes.
		 */
		for (j = 0, num_tasks = 0; thread_node_ct_left > 0;
		     num_tasks++, j += chunk_size, thread_node_ct_left -= chunk_size) {
			tdata = alloc_tdata_dup_nodes(flags, nsinfo, onodes, nnodes, j, j + chunk_size - 1);
			if (tdata == NULL) {
				th_err = 1;
				break;
			}
			task = static_cast<th_task_info *>(malloc(sizeof(th_task_info)));
			if (task == NULL) {
				free(tdata);
				th_err = 1;
				log_err(errno, __func__, MEM_ERR_MSG);
				break;
			}
			task->task_type = TS_DUP_ND_INFO;
			task->thread_data = (void *) tdata;

			queue_work_for_threads(task);
		}

		/* Get results from worker threads.  Every queued task is waited for,
		 * even after an error, so no worker is still writing into nnodes when
		 * it is released below.
		 */
		for (int i = 0; i < num_tasks;) {
			pthread_mutex_lock(&result_lock);
			while (ds_queue_is_empty(result_queue))
				pthread_cond_wait(&result_cond, &result_lock);
			while (!ds_queue_is_empty(result_queue)) {
				task = static_cast<th_task_info *>(ds_dequeue(result_queue));
				tdata = static_cast<th_data_dup_nd_info *>(task->thread_data);
				if (tdata->error)
					th_err = 1;
				free(tdata);
				free(task);
				i++;
			}
			pthread_mutex_unlock(&result_lock);
		}
	}

	if (th_err) {
		/* A failed or never queued chunk can leave a hole in the middle of the
		 * array.  Pack the nodes that were duplicated to the front so the array
		 * is contiguous and NULL terminated before it is released.
		 */
		int kept = 0;

		for (int i = 0; i < num_nodes; i++) {
			if (nnodes[i] != NULL)
				nnodes[kept++] = nnodes[i];
		}
		nnodes[kept] = NULL;
		free_nodes(nnodes);
		return NULL;
	}
	nnodes[num_nodes] = NULL;

	if (!(flags & DUP_INDIRECT)) {
		for (int i = 0; nnodes[i] != NULL; i++) {
			/* since the node list we're duplicating may have indirect resources
			 * which point to resources not in our node list, we need to detect it
			 * if we are in this case, we'll redirect them locally
			 */
			nres = nnodes[i]->res;
			while (nres != NULL) {
				if (nres->indirect_vnode_name != NULL) {
					ninfo = find_node_info(nnodes, nres->indirect_vnode_name);
					/* we found the problem -- first time we see it, we set the value
					 * of THIS node to the indirect value.  We'll then set all the rest
					 * to point to THIS node.
					 */
					if (ninfo == NULL) {
						ninfo = find_node_info(onodes, nnodes[i]->name);
						ores = (ninfo != NULL) ? find_resource(ninfo->res, nres->def) : NULL;
						if (ores != NULL && ores->indirect_res != NULL) {
							char namebuf[1024];

							snprintf(namebuf, sizeof(namebuf), "@%s", nnodes[i]->name.c_str());
							for (int j = i + 1; nnodes[j] != NULL; j++) {
								tres = find_resource(nnodes[j]->res, nres->def);
								if (tres != NULL) {
									/* only redirect resources which pointed at
									 * the same (missing) vnode as this one
									 */
									if (tres->indirect_vnode_name != NULL &&
									    !strcmp(nres->indirect_vnode_name,
										    tres->indirect_vnode_name)) {
										if (set_resource(tres, namebuf, RF_AVAIL) == 0) {
											free_nodes(nnodes);
											return NULL;
										}
									}
								}
							}
							if (set_resource(nres,
									 ores->indirect_res->orig_str_avail, RF_AVAIL) == 0) {
								free_nodes(nnodes);
								return NULL;
							}
							nres->assigned = ores->indirect_res->assigned;
						}
					}
				}
				nres = nres->next;
			}
		}
	}

	if (resolve_indirect_resources(nnodes) == 0) {
		free_nodes(nnodes);
		return NULL;
	}
	return nnodes;
}

/**
 * @brief
 *		dup_node_info - duplicate a node by creating a new one and copying all
 *		        the data into the new
 *
 * @param[in]	onode	-	the node to dup
 * @param[in]	nsinfo	-	the NEW server (i.e. duplicated)
 * @param[in]	flags	-	DUP_INDIRECT - duplicate target resources, not indirect
 *
 * @return	newly allocated and duped node
 * @retval	NULL	: onode is NULL, or the node or its partition string
 *			  could not be allocated
 *
 */
node_info *
dup_node_info(node_info *onode, server_info *nsinfo, unsigned int flags)
{
	node_info *nnode;

	if (onode == NULL)
		return NULL;

	if ((nnode = new node_info(onode->name)) == NULL)
		return NULL;

	nnode->server = nsinfo;
	nnode->mom = string_dup(onode->mom);
	nnode->queue_name = onode->queue_name;

	/* state bits */
	nnode->is_down = onode->is_down;
	nnode->is_free = onode->is_free;
	nnode->is_offline = onode->is_offline;
	nnode->is_unknown = onode->is_unknown;
	nnode->is_exclusive = onode->is_exclusive;
	nnode->is_job_exclusive = onode->is_job_exclusive;
	nnode->is_resv_exclusive = onode->is_resv_exclusive;
	nnode->is_sharing = onode->is_sharing;
	nnode->is_busy = onode->is_busy;
	nnode->is_job_busy = onode->is_job_busy;
	nnode->is_stale = onode->is_stale;
	nnode->is_maintenance = onode->is_maintenance;
	nnode->is_provisioning = onode->is_provisioning;
	nnode->is_multivnoded = onode->is_multivnoded;
	/* keep the ghost job marker (set by collect_jobs_on_nodes) on the copy */
	nnode->has_ghost_job = onode->has_ghost_job;

	nnode->sharing = onode->sharing;

	nnode->lic_lock = onode->lic_lock;

	nnode->rank = onode->rank;

	nnode->has_hard_limit = onode->has_hard_limit;
	nnode->no_multinode_jobs = onode->no_multinode_jobs;
	nnode->resv_enable = onode->resv_enable;
	nnode->provision_enable = onode->provision_enable;
	nnode->power_provisioning = onode->power_provisioning;

	nnode->num_jobs = onode->num_jobs;
	nnode->num_run_resv = onode->num_run_resv;
	nnode->num_susp_jobs = onode->num_susp_jobs;

	nnode->priority = onode->priority;

	nnode->jobs = dup_string_arr(onode->jobs);
	nnode->resvs = dup_string_arr(onode->resvs);
	if (flags & DUP_INDIRECT)
		nnode->res = dup_ind_resource_list(onode->res);
	else
		nnode->res = dup_resource_list(onode->res);

	nnode->max_running = onode->max_running;
	nnode->max_user_run = onode->max_user_run;
	nnode->max_group_run = onode->max_group_run;

	nnode->group_counts = dup_counts_umap(onode->group_counts);
	nnode->user_counts = dup_counts_umap(onode->user_counts);

	set_current_aoe(nnode, onode->current_aoe);
	set_current_eoe(nnode, onode->current_eoe);
	nnode->nodesig = string_dup(onode->nodesig);
	nnode->nodesig_ind = onode->nodesig_ind;
	nnode->last_state_change_time = onode->last_state_change_time;
	nnode->last_used_time = onode->last_used_time;

	/* map the server-node back pointer onto the new server's node array */
	if (onode->svr_node != NULL)
		nnode->svr_node = find_node_by_indrank(nsinfo->nodes, onode->node_ind, onode->rank);

	/* Duplicate list of jobs and running reservations.
	 * If caller is server_info's copy constructor then nsinfo->resvs/jobs should be NULL,
	 * but running reservations and jobs are collected later in the caller.
	 * Otherwise, we collect running reservations or jobs here.
	 */
	nnode->run_resvs_arr = copy_resresv_array(onode->run_resvs_arr, nsinfo->resvs);
	nnode->job_arr = copy_resresv_array(onode->job_arr, nsinfo->jobs);

	/* If we are called from dup_server(), nsinfo->hostsets are NULL.
	 * They are not created yet.  Hostsets will be attached in dup_server()
	 */
	if (onode->hostset != NULL)
		nnode->hostset = find_node_partition_by_rank(nsinfo->hostsets,
							     onode->hostset->rank);

	nnode->bucket_ind = onode->bucket_ind;
	nnode->node_ind = onode->node_ind;

	nnode->nscr = onode->nscr;

	if (onode->partition != NULL) {
		nnode->partition = string_dup(onode->partition);
		if (nnode->partition == NULL) {
			delete nnode;
			return NULL;
		}
	}

	return nnode;
}

/**
 * @brief
 *		copy_node_ptr_array - build a new array of node pointers which
 *			      mirrors oarr but points at the matching nodes
 *			      of narr (same nodes, different array).
 *			      Each node of oarr is looked up in narr by its
 *			      node index and rank.
 *
 *
 * @param[in]	oarr	-	the old array (filtered array)
 * @param[in]	narr	-	the new array (entire node array)
 *
 * @return	copied array (malloc'd, NULL terminated; the nodes belong to narr)
 * @retval	NULL	: on error - a NULL argument, malloc failure, or a node
 *			  of oarr which has no counterpart in narr
 *
 */
node_info **
copy_node_ptr_array(node_info **oarr, node_info **narr)
{
	if (oarr == NULL || narr == NULL)
		return NULL;

	int cnt = 0;
	while (oarr[cnt] != NULL)
		cnt++;

	node_info **copy = static_cast<node_info **>(malloc(sizeof(node_info *) * (cnt + 1)));
	if (copy == NULL)
		return NULL;

	for (int idx = 0; idx < cnt; idx++) {
		copy[idx] = find_node_by_indrank(narr, oarr[idx]->node_ind, oarr[idx]->rank);
		if (copy[idx] == NULL) {
			/* only the pointer array is ours to release */
			free(copy);
			return NULL;
		}
	}
	copy[cnt] = NULL;

	return copy;
}

/**
 * @brief
 *		collect_resvs_on_nodes - for every node, filter the resv array
 *				down to the resvs running on that node and
 *				store the result in the node's run_resvs_arr
 *
 * @param[in,out]	ninfo_arr	-	the nodes to collect for
 * @param[in]	resresv_arr	-	the array of resvs to consider
 * @param[in]	size	-	the size (in number of pointers) of the resv array
 *
 * @return	int
 * @retval	1	: success
 * @retval	0	: failure (ninfo_arr is NULL or empty)
 *
 */
int
collect_resvs_on_nodes(node_info **ninfo_arr, resource_resv **resresv_arr, int size)
{
	if (ninfo_arr == NULL || ninfo_arr[0] == NULL)
		return 0;

	for (node_info **np = ninfo_arr; *np != NULL; np++) {
		node_info *node = *np;

		/* the count of running resvs on the node is set in query_reservations */
		node->run_resvs_arr = resource_resv_filter(resresv_arr, size,
							   check_resv_running_on_node, node->name.c_str(), 0);
	}
	return 1;
}

/**
 * @brief
 *		collect_jobs_on_nodes - collect all the jobs in the job array on the
 *				nodes
 *
 * Each node's job_arr is rebuilt from the job names the node reports (its
 * jobs array), the per-node user/group counts are updated for nodes with hard
 * limits, and num_susp_jobs is bumped on every node a suspended job holds.
 *
 * @param[in,out]	ninfo_arr	-	the nodes to collect for
 * @param[in]	resresv_arr	-	the array of jobs to consider
 * @param[in]	size	-	the size (in number of pointers) of the job arrays
 * @param[in]	flags	-	DETECT_GHOST_JOBS - mark nodes (has_ghost_job) which
 *				report a job that is not in resresv_arr
 *
 * @note	the "/sub_node" suffix of each entry in a node's jobs array is
 *		cut off in place.
 *
 * @retval	1	: upon success
 * @retval	0	: upon failure
 *
 */
int
collect_jobs_on_nodes(node_info **ninfo_arr, resource_resv **resresv_arr, int size, int flags)
{
	if (ninfo_arr == NULL || ninfo_arr[0] == NULL)
		return 0;

	const bool detect_ghosts = (flags & DETECT_GHOST_JOBS) != 0;

	/* Pass 1: give every node an empty job array big enough for all jobs */
	for (node_info **np = ninfo_arr; *np != NULL; np++) {
		node_info *cur = *np;

		cur->job_arr = static_cast<resource_resv **>(malloc((size + 1) * sizeof(resource_resv *)));
		if (cur->job_arr == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			return 0;
		}
		cur->job_arr[0] = NULL;
	}

	/* Pass 2: resolve the job names reported by each node into job pointers */
	for (node_info **np = ninfo_arr; *np != NULL; np++) {
		node_info *cur = *np;

		if (cur->jobs == NULL)
			continue;

		/* If there are no running jobs in the list and node reports a running job,
		 * mark that the node has ghost job
		 */
		if (size == 0 && detect_ghosts) {
			cur->has_ghost_job = 1;
			log_event(PBSEVENT_DEBUG2, PBS_EVENTCLASS_NODE, LOG_DEBUG, cur->name,
				  "Jobs reported running on node no longer exists or are not in running state");
		}

		int filled = 0;
		for (int j = 0; cur->jobs[j] != NULL && filled < size; j++) {
			/* jobs are in the format of node_name/sub_node.  We don't care about
			 * the subnode... we just want to populate the jobs on our node
			 * structure
			 */
			char *slash = strchr(cur->jobs[j], '/');
			if (slash != NULL)
				*slash = '\0';

			resource_resv *found = find_resource_resv(resresv_arr, cur->jobs[j]);
			if (found == NULL || found->nspec_arr.empty()) {
				if (detect_ghosts) {
					/* Race Condition occurred: nodes were queried when a job existed.
					 * Jobs were queried when the job no longer existed.  Make note
					 * of it on the job so the node's resources_assigned values can be
					 * recalculated later.
					 */
					cur->has_ghost_job = 1;
					log_eventf(PBSEVENT_DEBUG2, PBS_EVENTCLASS_NODE, LOG_DEBUG, cur->name,
						   "Job %s reported running on node no longer exists or is not in running state",
						   cur->jobs[j]);
				}
				continue;
			}

			/* if a distributed job has more then one instance on this node
			 * it'll show up more then once.  If this is the case, we only
			 * want to have the job in our array once.
			 */
			if (find_resource_resv_by_indrank(cur->job_arr, -1, found->rank) != NULL)
				continue;

			if (cur->has_hard_limit) {
				counts *grp_cts = find_alloc_counts(cur->group_counts,
								    found->group);
				update_counts_on_run(grp_cts, found->resreq);

				counts *usr_cts = find_alloc_counts(cur->user_counts,
								    found->user);
				update_counts_on_run(usr_cts, found->resreq);
			}

			cur->job_arr[filled] = found;
			filled++;
			/* make the job array searchable with find_resource_resv */
			cur->job_arr[filled] = NULL;
		}
		cur->num_jobs = filled;
	}

	/* Pass 3: shrink every job array to the number of jobs actually found */
	for (node_info **np = ninfo_arr; *np != NULL; np++) {
		node_info *cur = *np;
		resource_resv **shrunk = static_cast<resource_resv **>(realloc(cur->job_arr, (cur->num_jobs + 1) * sizeof(resource_resv *)));

		if (shrunk == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			return 0;
		}
		cur->job_arr = shrunk;
		cur->job_arr[cur->num_jobs] = NULL;
	}

	/* Finally count the suspended jobs on each node they were running on */
	resource_resv **susp = resource_resv_filter(resresv_arr,
						    count_array(resresv_arr), check_susp_job, NULL, 0);
	if (susp == NULL)
		return 0;

	for (int i = 0; susp[i] != NULL; i++) {
		auto job_nodes = susp[i]->ninfo_arr;

		if (job_nodes == NULL)
			continue;

		for (int j = 0; job_nodes[j] != NULL; j++) {
			/* resresv->ninfo_arr is merely a new list with pointers to server nodes.
			 * resresv->resv->resv_nodes is a new list with pointers to resv nodes
			 */
			node_info *hit = find_node_info(ninfo_arr, job_nodes[j]->name);

			if (hit != NULL)
				hit->num_susp_jobs++;
		}
	}
	free(susp);

	return 1;
}

/**
 * @brief
 *		update_node_on_run - update internal scheduler node data when a
 *			     resource resv is run.
 *
 * The node is taken from ns->ninfo.  Nothing is done if that node is
 * offline or down.  Otherwise the job/resv is added to the node's arrays,
 * consumable resources are added to the node's assigned amounts, node state
 * bits are adjusted and the node is moved into the busy pool of its bucket.
 *
 * @param[in]	ns	-	the nspec for the node allocation
 * @param[in]	resresv -	the resource rev which ran
 * @param[in]  job_state -	the old state of a job if resresv is a job
 *				If the old_state is found to be suspended
 *				then only resources that were released
 *				during suspension will be accounted.
 *
 * @return	nothing
 *
 */
void
update_node_on_run(nspec *ns, resource_resv *resresv, const char *job_state)
{
	resource_req *resreq;
	schd_resource *ncpusres = NULL;
	resource_resv **tmp_arr;
	node_info *ninfo;

	if (ns == NULL || resresv == NULL)
		return;

	ninfo = ns->ninfo;

	/* Don't account for resources of a node that is unavailable */
	if (ninfo->is_offline || ninfo->is_down)
		return;

	/* bump the running count and list the job/resv on the node exactly once */
	if (resresv->is_job) {
		ninfo->num_jobs++;
		if (find_resource_resv_by_indrank(ninfo->job_arr, resresv->resresv_ind, resresv->rank) == NULL) {
			tmp_arr = add_resresv_to_array(ninfo->job_arr, resresv, NO_FLAGS);
			/* giving up here leaves the count above already incremented */
			if (tmp_arr == NULL)
				return;

			ninfo->job_arr = tmp_arr;
		}

	} else if (resresv->is_resv) {
		ninfo->num_run_resv++;
		if (find_resource_resv_by_indrank(ninfo->run_resvs_arr, resresv->resresv_ind, resresv->rank) == NULL) {
			tmp_arr = add_resresv_to_array(ninfo->run_resvs_arr, resresv, NO_FLAGS);
			if (tmp_arr == NULL)
				return;

			ninfo->run_resvs_arr = tmp_arr;
		}
	}

	/* By default account for the whole chunk request.  If the old state was
	 * 'S' and a released-resources entry exists for this node, account for
	 * that list instead.
	 */
	resreq = ns->resreq;
	if ((job_state != NULL) && (*job_state == 'S')) {
		if (!resresv->job->resreleased.empty()) {
			nspec *temp = find_nspec_by_rank(resresv->job->resreleased, ninfo->rank);
			if (temp != NULL)
				resreq = temp->resreq;
		}
	}
	while (resreq != NULL) {
		if (resreq->type.is_consumable) {
			schd_resource *res;

			res = find_resource(ninfo->res, resreq->def);

			if (res != NULL) {
				/* indirect resources are accounted on the resource they point to */
				if (res->indirect_res != NULL)
					res = res->indirect_res;

				res->assigned += resreq->amount;

				/* remember ncpus so it need not be looked up again below */
				if (res->def == allres["ncpus"]) {
					ncpusres = res;
				}
			}
		}
		resreq = resreq->next;
	}

	/* the user/group counts always use the full chunk request (ns->resreq),
	 * not the released list selected above
	 */
	if (ninfo->has_hard_limit && resresv->is_job) {
		counts *cts;

		cts = find_alloc_counts(ninfo->group_counts, resresv->group);
		update_counts_on_run(cts, ns->resreq);

		cts = find_alloc_counts(ninfo->user_counts, resresv->user);
		update_counts_on_run(cts, ns->resreq);
	}

	/* if we're a cluster node and we have no cpus available, we're job_busy */
	if (ncpusres == NULL)
		ncpusres = find_resource(ninfo->res, allres["ncpus"]);

	if (ncpusres != NULL) {
		if (dynamic_avail(ncpusres) == 0)
			set_node_info_state(ninfo, ND_jobbusy);
	}

	/* if node selected for provisioning, this node is no longer available */
	if (ns->go_provision == 1) {
		set_node_info_state(ninfo, ND_prov);

		/* for jobs inside reservation, update the server's node info as well */
		if (resresv->job != NULL && resresv->job->resv != NULL &&
		    ninfo->svr_node != NULL) {
			set_node_info_state(ninfo->svr_node, ND_prov);
		}

		set_current_aoe(ninfo, resresv->aoename);
	}

	/* if job has eoe setting this node gets current_eoe set */
	if (resresv->is_job && resresv->eoename != NULL)
		set_current_eoe(ninfo, resresv->eoename);

	/* exclusive placement: flag the node (and for jobs, the server's copy too) */
	if (is_excl(resresv->place_spec, ninfo->sharing)) {
		if (resresv->is_resv) {
			add_node_state(ninfo, ND_resv_exclusive);
		} else {
			add_node_state(ninfo, ND_job_exclusive);
			if (ninfo->svr_node != NULL)
				add_node_state(ninfo->svr_node, ND_job_exclusive);
		}
	}

	/* the run event is taken off the node's event list */
	if (resresv->run_event != NULL)
		remove_te_list(&ninfo->node_events, resresv->run_event);

	/* Move the node into the busy pool of its bucket.
	 * NOTE(review): the else branch assumes a node which is not in the free
	 * pool is in the busy_later pool; confirm a node already in the busy pool
	 * cannot reach this point, otherwise the truth counts would drift.
	 */
	if (ninfo->node_ind != -1 && ninfo->bucket_ind != -1) {
		node_bucket *bkt = ninfo->server->buckets[ninfo->bucket_ind];
		int ind = ninfo->node_ind;

		if (pbs_bitmap_get_bit(bkt->free_pool->truth, ind)) {
			pbs_bitmap_bit_off(bkt->free_pool->truth, ind);
			bkt->free_pool->truth_ct--;
		} else {
			pbs_bitmap_bit_off(bkt->busy_later_pool->truth, ind);
			bkt->busy_later_pool->truth_ct--;
		}

		pbs_bitmap_bit_on(bkt->busy_pool->truth, ind);
		bkt->busy_pool->truth_ct++;
	}
}

/**
 * @brief
 *		update_node_on_end - update a node when a resource resv ends
 *
 * Nothing is done if the node is offline or down.  Otherwise the job/resv
 * is removed from the node's arrays, busy/exclusive state bits are removed,
 * the consumable resources of every nspec of resresv on this node are
 * subtracted from the node's assigned amounts, and the node's bucket pools
 * are updated once no jobs remain on the node.
 *
 * @param[in]	ninfo	-	the node where the job was running
 * @param[in]	resresv -	the resource resv which is ending
 * @param[in]	job_state -	the old state of a job if resresv is a job
 *				If the old_state is found to be suspended
 *				then only resources that were released
 *				during suspension will be accounted.
 *
 * @return	nothing
 *
 */
void
update_node_on_end(node_info *ninfo, resource_resv *resresv, const char *job_state)
{
	resource_req *resreq = NULL;
	schd_resource *res = NULL;
	counts *cts;
	int ind;

	if (ninfo == NULL || resresv == NULL)
		return;

	/* Don't account for resources of a node that is unavailable */
	if (ninfo->is_offline || ninfo->is_down)
		return;

	/* drop the running count (never below zero) and unlist the job/resv */
	if (resresv->is_job) {
		ninfo->num_jobs--;
		if (ninfo->num_jobs < 0)
			ninfo->num_jobs = 0;

		remove_resresv_from_array(ninfo->job_arr, resresv);
	} else if (resresv->is_resv) {
		ninfo->num_run_resv--;
		if (ninfo->num_run_resv < 0)
			ninfo->num_run_resv = 0;

		remove_resresv_from_array(ninfo->run_resvs_arr, resresv);
	}

	if (ninfo->is_job_busy)
		remove_node_state(ninfo, ND_jobbusy);
	/* exclusive placement: clear the flag on the node (and for jobs, on the server's copy too) */
	if (is_excl(resresv->place_spec, ninfo->sharing)) {
		if (resresv->is_resv)
			remove_node_state(ninfo, ND_resv_exclusive);
		else {
			remove_node_state(ninfo, ND_job_exclusive);
			if (ninfo->svr_node != NULL)
				remove_node_state(ninfo->svr_node, ND_job_exclusive);
		}
	}

	/* release the resources of every chunk of resresv placed on this node */
	for (auto ns : resresv->nspec_arr) {
		if (ns->ninfo == ninfo) {
			/* By default release the whole chunk request.  If the old state
			 * was 'S' and a released-resources entry exists for this node,
			 * release that list instead.
			 */
			resreq = ns->resreq;
			if ((job_state != NULL) && (*job_state == 'S')) {
				if (!resresv->job->resreleased.empty()) {
					nspec *temp = find_nspec_by_rank(resresv->job->resreleased, ninfo->rank);
					if (temp != NULL)
						resreq = temp->resreq;
				}
			}
			while (resreq != NULL) {
				if (resreq->type.is_consumable) {
					res = find_resource(ninfo->res, resreq->def);
					if (res != NULL) {
						/* indirect resources are accounted on the resource they point to */
						if (res->indirect_res != NULL)
							res = res->indirect_res;
						res->assigned -= resreq->amount;
						/* clamp at zero rather than carrying a negative amount */
						if (res->assigned < 0) {
							log_eventf(PBSEVENT_DEBUG, PBS_EVENTCLASS_NODE, LOG_DEBUG, ninfo->name,
								   "%s turned negative %.2lf, setting it to 0", res->name, res->assigned);
							res->assigned = 0;
						}
					}
				}
				resreq = resreq->next;
			}
			/* no soft limits on nodes... just hard limits */
			/* the counts always use the full chunk request (ns->resreq) */
			if (ninfo->has_hard_limit && resresv->is_job) {
				cts = find_counts(ninfo->group_counts, resresv->group);

				if (cts != NULL)
					update_counts_on_end(cts, ns->resreq);

				cts = find_counts(ninfo->user_counts, resresv->user);

				if (cts != NULL)
					update_counts_on_end(cts, ns->resreq);
			}
		}
	}

	/* Once no jobs are left, move the node out of the busy pool of its bucket:
	 * into the free pool if the node has no events, else into busy_later.
	 * NOTE(review): this runs for ending reservations as well whenever
	 * num_jobs is 0; confirm the node is always in the busy pool at this point.
	 */
	ind = ninfo->node_ind;
	if (ind != -1 && ninfo->bucket_ind != -1 && ninfo->num_jobs == 0) {
		node_bucket *bkt = ninfo->server->buckets[ninfo->bucket_ind];

		if (ninfo->node_events == NULL) {
			pbs_bitmap_bit_on(bkt->free_pool->truth, ind);
			bkt->free_pool->truth_ct++;
		} else {
			pbs_bitmap_bit_on(bkt->busy_later_pool->truth, ind);
			bkt->busy_later_pool->truth_ct++;
		}
		pbs_bitmap_bit_off(bkt->busy_pool->truth, ind);
		bkt->busy_pool->truth_ct--;
	}
}

// default constructor: an empty nspec which is not yet tied to a node,
// a resource request list or a chunk
nspec::nspec()
{
	ninfo = NULL;
	resreq = NULL;
	chk = NULL;

	seq_num = 0;
	sub_seq_num = 0;

	end_of_chunk = 0;
	go_provision = 0;
}

// destructor: releases the resource request list held by this nspec.
// The ninfo and chk pointers are not released here.
nspec::~nspec()
{
	free_resource_req_list(resreq);
}

/**
 * @brief	copy constructor which re-targets the copy at another node array
 *
 * @param[in]	ons		- the nspec to copy
 * @param[in]	ninfo_arr	- node array in which the copy's node is looked
 *				  up (by node index and rank of ons' node)
 * @param[in]	sel		- select spec in which the copy's chunk is looked
 *				  up by sequence number; may be NULL, in which
 *				  case the copy has no chunk (chk is NULL)
 */
nspec::nspec(const nspec &ons, node_info **ninfo_arr, selspec *sel)
{
	end_of_chunk = ons.end_of_chunk;
	seq_num = ons.seq_num;
	sub_seq_num = ons.sub_seq_num;
	go_provision = ons.go_provision;
	ninfo = find_node_by_indrank(ninfo_arr, ons.ninfo->node_ind, ons.ninfo->rank);
	/* the request list is deep copied: the destructor frees it */
	resreq = dup_resource_req_list(ons.resreq);
	/* never leave chk uninitialized when there is no select spec to map to */
	if (sel != NULL)
		chk = find_chunk_by_seq_num(sel->chunks, ons.seq_num);
	else
		chk = NULL;
}

/**
 * @brief
 * 		dup_nspecs - duplicate an array of nspecs
 *
 * @param[in]	onspecs		- the nspecs to duplicate
 * @param[in]	ninfo_arr	- the nodes corresponding to the nspecs
 * @param[in]	sel		- select spec to map nspecs to
 * @return	duplicated nspec array; empty if onspecs is empty or
 *		ninfo_arr is NULL.  The new nspecs are allocated with new.
 *
 */
std::vector<nspec *>
dup_nspecs(const std::vector<nspec *> &onspecs, node_info **ninfo_arr, selspec *sel)
{
	std::vector<nspec *> copies;

	/* without a node array there is nothing to map the copies onto */
	if (ninfo_arr != NULL) {
		for (nspec *orig : onspecs)
			copies.push_back(new nspec(*orig, ninfo_arr, sel));
	}

	return copies;
}

/**
 * @brief
 * 		free_nspecs - delete every nspec of an array and empty the array
 *
 * @param[in,out]	nspec_arr	-	the nspec array; empty on return
 *
 * @return	nothing
 *
 */
void
free_nspecs(std::vector<nspec *> &nspec_arr)
{
	for (auto it = nspec_arr.begin(); it != nspec_arr.end(); ++it)
		delete *it;

	/* drop the now dangling pointers */
	nspec_arr.clear();
}

/**
 * @brief
 *		find_nspec - find the first nspec of an array which is placed on
 *			     a given node
 *
 * @param[in]	nspec_arr	-	the array of nspecs to search
 * @param[in]	ninfo	-	the node_info to find (compared by pointer)
 *
 * @return	the found nspec
 * @retval	NULL	: ninfo is NULL or no nspec is on that node
 *
 */
nspec *
find_nspec(std::vector<nspec *> &nspec_arr, node_info *ninfo)
{
	if (ninfo != NULL) {
		for (nspec *candidate : nspec_arr) {
			if (candidate->ninfo == ninfo)
				return candidate;
		}
	}

	return NULL;
}

/**
 * @brief
 * 		find the first nspec of an array whose node has a given rank
 *
 * @param[in]	nspec_arr	-	the array of nspecs to search
 * @param[in]	rank	-	the unique integer identifier of the nspec/node to search for
 *
 * @return	the found nspec
 * @retval	NULL	: no nspec's node has that rank
 *
 */
nspec *
find_nspec_by_rank(std::vector<nspec *> &nspec_arr, int rank)
{
	for (auto it = nspec_arr.begin(); it != nspec_arr.end(); ++it) {
		nspec *candidate = *it;

		if (candidate->ninfo->rank == rank)
			return candidate;
	}

	return NULL;
}

/**
 *	@brief
 *		eval a select spec to see if it is satisfiable
 *
 * Without node partitions the spec is evaluated once over ninfo_arr.  With
 * node partitions each partition is tried in order until one satisfies the
 * spec; if the request cannot fit into any partition it is either evaluated
 * over all nodes (SPAN_PSETS) or rejected with CANT_SPAN_PSET.
 *
 * @param[in]	policy	  -	policy info
 * @param[in]	spec	  -	the select spec
 * @param[in]	placespec -	the placement spec (-l place)
 * @param[in]	ninfo_arr - 	array of nodes to satisfy the spec
 * @param[in]	nodepart  -	the node partition array for node grouping
 *		 	 	if NULL, we're not doing node grouping
 * @param[in]	resresv	  -	the resource resv the spec is from
 * @param[in]	flags	  -	flags to change functions behavior
 *	      			EVAL_OKBREAK - ok to break chunk up across vnodes
 *	      			EVAL_EXCLSET - allocate entire nodelist exclusively
 *	      			SPAN_PSETS - fall back to all nodes if the request
 *	      				     fits into no placement set
 * @param[out]	nspec_arr -	the node solution
 * @param[out]	err	  -	error structure to return error information
 *
 * @return	bool
 * @retval	true	  : 	if the nodespec can be satisfied
 * @retval	false	  : 	if not
 *
 */
bool
eval_selspec(status *policy, selspec *spec, place *placespec,
	     node_info **ninfo_arr, node_partition **nodepart, resource_resv *resresv,
	     unsigned int flags, std::vector<nspec *> &nspec_arr, schd_error *err)
{
	place *pl;
	int can_fit = 0; /* set once the request fits (or could fit) into some placement set */
	bool rc = false; /* true if resources are available, false if not */
	int pass_flags = NO_FLAGS; /* flags handed to eval_placement() */
	char reason[MAX_LOG_SIZE] = {0};
	int i = 0;
	/* Holds the first failure seen so it can be reported if err ends up empty.
	 * Allocated on the first call and reused (cleared) on later calls.
	 * NOTE(review): shared static state - presumably this is only ever called
	 * from one thread; confirm.
	 */
	static struct schd_error *failerr = NULL;

	if (spec == NULL || ninfo_arr == NULL || resresv == NULL || placespec == NULL)
		return false;
	/* Unsetting RETURN_ALL_ERR flag, because with this flag set resresv_can_fit_nodepart can return
	 * with multiple errors and the function only needs to see the first error it encounters.
	 */
	flags &= ~RETURN_ALL_ERR;

	if (failerr == NULL) {
		failerr = new_schd_error();
		if (failerr == NULL) {
			set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);
			return false;
		}
	} else
		clear_schd_error(failerr);

	/* Remove visited, scattered and ineligible bits from ncsr for node searching
	 * Since statebusy is a per cycle bit, it shouldn't be changed
	 */
	for (i = 0; ninfo_arr[i] != NULL; i++)
		ninfo_arr[i]->nscr &= ~(NSCR_VISITED | NSCR_SCATTERED | NSCR_INELIGIBLE);

	pl = placespec;

	if (flags != NO_FLAGS)
		pass_flags = flags;

	check_node_array_eligibility(ninfo_arr, resresv, pl, err);

	/* stash whatever the eligibility check reported and start with a clean err */
	if (failerr->status_code == SCHD_UNKWN)
		move_schd_error(failerr, err);
	clear_schd_error(err);

	/* If we are not node grouping or we only have 1 chunk packed onto a single
	 * host, then we should try and satisfy over all nodes in the list
	 *
	 * NOTE: pack && total_chunks == 1 may not be valid once chunks are
	 * broken into vchunks
	 */
	if (nodepart == NULL) {
		if (resresv->server->has_multi_vnode && ok_break_chunk(resresv, ninfo_arr))
			pass_flags |= EVAL_OKBREAK;

		rc = eval_placement(policy, spec, ninfo_arr, pl, resresv, pass_flags, nspec_arr, err);
		if (!rc)
			free_nspecs(nspec_arr);

		/* NOTE(review): this is called even when rc is false and nspec_arr
		 * has just been emptied - confirm alloc_rest_nodepart() copes with that
		 */
		if (pass_flags & EVAL_EXCLSET)
			alloc_rest_nodepart(nspec_arr, ninfo_arr);

		/* no error from the placement itself: report the stashed one, if any */
		if (err->status_code == SCHD_UNKWN && failerr->status_code != SCHD_UNKWN)
			move_schd_error(err, failerr);

		return rc;
	}

	/* Otherwise we're node grouping... */

	/* try the placement sets in order and stop at the first one that works */
	for (i = 0; nodepart[i] != NULL && rc == 0; i++) {
		clear_schd_error(err);
		if (resresv_can_fit_nodepart(policy, nodepart[i], resresv, flags, err)) {
			log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG, resresv->name,
				   "Evaluating placement set: %s", nodepart[i]->name);
			if (nodepart[i]->ok_break)
				pass_flags |= EVAL_OKBREAK;

			if (nodepart[i]->excl)
				pass_flags |= EVAL_EXCLSET;

			rc = eval_placement(policy, spec, nodepart[i]->ninfo_arr, pl,
					    resresv, pass_flags, nspec_arr, err);
			if (rc) {
				/* remember which placement set the request landed in */
				if (resresv->nodepart_name != NULL)
					free(resresv->nodepart_name);
				resresv->nodepart_name = string_dup(nodepart[i]->name);
				can_fit = 1;
				if (nodepart[i]->excl)
					alloc_rest_nodepart(nspec_arr, nodepart[i]->ninfo_arr);
			} else {
				free_nspecs(nspec_arr);
				/* keep only the first failure */
				if (failerr->status_code == SCHD_UNKWN)
					copy_schd_error(failerr, err);
			}
		} else {
			translate_fail_code(err, NULL, reason);
			log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG, resresv->name,
				   "Placement set %s is too small: %s", nodepart[i]->name, reason);
			set_schd_error_codes(err, NOT_RUN, SET_TOO_SMALL);
			set_schd_error_arg(err, ARG1, "Placement");
#ifdef NAS /* localmod 031 */
			set_schd_error_arg(err, ARG2, "for resource model");
#else
			set_schd_error_arg(err, ARG2, nodepart[i]->name);
#endif /* localmod 031 */
			if (failerr->status_code == SCHD_UNKWN)
				copy_schd_error(failerr, err);
		}

		/* the set cannot run the request now: re-check it with COMPARE_TOTAL
		 * added to see whether the request counts as fitting this set at all
		 */
		if (!can_fit && !rc &&
		    resresv_can_fit_nodepart(policy, nodepart[i], resresv, flags | COMPARE_TOTAL, err)) {
			can_fit = 1;
		}
		/* note: this resets to NO_FLAGS, not to the caller's flags */
		pass_flags = NO_FLAGS;
	}

	if (!can_fit) {
		if (flags & SPAN_PSETS) {
			log_event(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG, resresv->name,
				  "Request won't fit into any placement sets, will use all nodes");
			resresv->can_not_fit = 1;
			if (resresv->server->has_multi_vnode && ok_break_chunk(resresv, ninfo_arr))
				pass_flags |= EVAL_OKBREAK;

			rc = eval_placement(policy, spec, ninfo_arr, pl, resresv, pass_flags, nspec_arr, err);
		} else {
			set_schd_error_codes(err, NEVER_RUN, CANT_SPAN_PSET);
			/* CANT_SPAN_PSET is more important than any other error we may have encountered -- keep it*/
			clear_schd_error(failerr);
			copy_schd_error(failerr, err);
		}
	}

	if (!rc)
		free_nspecs(nspec_arr);

	/* nothing reported for the final attempt: fall back to the first failure seen */
	if (err->status_code == SCHD_UNKWN && failerr->status_code != SCHD_UNKWN)
		move_schd_error(err, failerr);

	return rc;
}

/**
 * @brief
 * 		handle the place spec for vnode placement of chunks
 *
 * 		The nodes are grouped by host and every host is offered, in turn,
 * 		to the strategy selected by the place spec (pack, vscatter,
 * 		scatter or free) until all chunks of the select spec have been
 * 		placed or there are no more hosts to try.
 *
 * @param[in] policy     - policy info
 * @param[in] spec       - the select spec
 * @param[in] ninfo_arr  - array of nodes to satisfy the spec
 * @param[in] pl         - parsed placement spec
 * @param[in] resresv    - the resource resv the spec is from
 * @param[in] flags	-	flags to change function's behavior
 *	      				EVAL_OKBREAK - ok to break chunk up across vnodes
 * @param[out]	nspec_arr	-	the node solution will be appended to this
 *				   				vector.  Entries of hosts which satisfied at
 *				   				least one chunk are appended even if the whole
 *				   				spec ends up not being satisfied.
 * @param[out]	err	-	error structure to return error information
 *
 * @return	bool
 * @retval	true	: if the selspec can be satisfied
 * @retval	false	: if not
 *
 */
bool
eval_placement(status *policy, selspec *spec, node_info **ninfo_arr, place *pl,
	       resource_resv *resresv, unsigned int flags,
	       std::vector<nspec *> &nspec_arr, schd_error *err)
{
	np_cache *npc = NULL;
	node_partition **hostsets = NULL;
	int tot = 0; /* number of chunks placed so far */
	resource_req *req = NULL;
	schd_resource *res = NULL;
	selspec *dselspec = NULL; /* private copy of spec whose num_chunks are counted down */
	node_info **nptr = NULL;  /* the node array actually searched (possibly reordered) */
	/* remembers the first failure seen; allocated once and reused across calls */
	static schd_error *failerr = NULL;

	if (spec == NULL || ninfo_arr == NULL || pl == NULL || resresv == NULL)
		return 0;

	if (failerr == NULL) {
		failerr = new_schd_error();
		if (failerr == NULL) {
			set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);
			return 0;
		}
	} else
		clear_schd_error(failerr);

	/* reorder nodes for smp_cluster_dist or avoid_provision.
	 *
	 * remark: reorder_nodes doesn't reorder in place, returns
	 *         a ptr to a reordered static array
	 */
	if ((pl->pack && spec->total_chunks == 1) ||
	    (conf.provision_policy == AVOID_PROVISION && resresv->aoename != NULL))
		nptr = reorder_nodes(ninfo_arr, resresv);

	/* no reordering requested (or it returned nothing): search the nodes as given */
	if (nptr == NULL)
		nptr = ninfo_arr;

	/*
	 * eval_complex_selspec() handles placement for single vnoded systems.
	 * it should be merged into this function in a optimized way, but until
	 * we short circuit this function and fall into it.  This function doesn't
	 * handle multi-chunk pack.  We still fall into it in the case of a single
	 * chunk.
	 */
	if (!resresv->server->has_multi_vnode &&
	    (!resresv->place_spec->pack || spec->total_chunks == 1)) {
		return eval_complex_selspec(policy, spec, nptr, pl, resresv, flags, nspec_arr, err);
	}

	/* get a pool of node partitions based on host.  If we're using the
	 * server's nodes, we can use the pre-created host sets.
	 */
	if (nptr == resresv->server->nodes)
		hostsets = resresv->server->hostsets;

	/* otherwise look up (or create) host partitions for this node array in the np cache */
	if (hostsets == NULL) {
		std::vector<std::string> host_arr{"host"};
		npc = find_alloc_np_cache(policy, resresv->server->npc_arr, host_arr, nptr, NULL);
		if (npc != NULL)
			hostsets = npc->nodepart;
	}

	if (hostsets != NULL) {
		/* scatter, vscatter and free decrement per-chunk counts as they place
		 * chunks, so they work on a copy of the spec.  pack does not need one.
		 */
		if (pl->scatter || pl->vscatter || pl->free) {
			dselspec = new selspec(*spec);
			if (dselspec == NULL)
				return false;
		}

		/* try one host at a time until every chunk has been placed */
		for (int i = 0; hostsets[i] != NULL && tot != spec->total_chunks; i++) {
			/* if one vnode on a host is set to force/dflt exclhost
			 * then they all are.  The mom makes sure of this
			 */
			std::vector<nspec *> nsa; /* node solution found on this host */
			node_info **dninfo_arr = hostsets[i]->ninfo_arr;
			enum vnode_sharing sharing = VNS_DFLT_SHARED;
			bool do_exclhost = false;
			bool rc = false; /* true if current chunk was successfully allocated */
			/* true if any vnode is allocated from a host - used in exclhost allocation */
			bool any_succ_rc = false;

			if (dninfo_arr[0] != NULL)
				sharing = dninfo_arr[0]->sharing;

			/* EVAL_EXCLSET is decided per host; drop whatever the previous host set */
			flags &= ~EVAL_EXCLSET;
			if (sharing == VNS_FORCE_EXCLHOST ||
			    (sharing == VNS_DFLT_EXCLHOST && pl->excl == 0 && pl->share == 0) || pl->exclhost) {
				do_exclhost = true;
				flags |= EVAL_EXCLSET;
			}

			log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
				   resresv->name, "Evaluating host %s", hostsets[i]->res_val);

			/* Pack on One Host Placement:
			 * place all chunks on one host.  This is done with a call
			 * to eval_complex_selspec().
			 */
			if (pl->pack) {
				rc = eval_complex_selspec(policy, spec, dninfo_arr, pl,
							  resresv, flags | EVAL_OKBREAK, nsa, err);
				if (rc) {
					any_succ_rc = true;
					/* the whole spec fit on this host, which ends the host loop */
					tot = spec->total_chunks;
				} else {
					free_nspecs(nsa);
					/* keep only the first failure; later ones are discarded */
					if (failerr->status_code == SCHD_UNKWN)
						move_schd_error(failerr, err);
					clear_schd_error(err);
				}
			}
			/* Scatter by Vnode Placement:
			 * place at most one chunk on any one vnode.  This is done by successive
			 * calls to eval_simple_selspec().  When it returns true, the vnodes it
			 * used are marked NSCR_SCATTERED in dninfo_arr[] so we don't allocate
			 * them again.
			 */
			else if (pl->vscatter) {
				for (int c = 0; dselspec->chunks[c] != NULL; c++) {
					/* setting rc=1 forces at least 1 loop of the while.  This should be
					 * be rewritten in the do/while() style seen in the free block below
					 */
					rc = true;
					if ((hostsets[i]->free_nodes > 0) && (check_avail_resources(hostsets[i]->res,
												    dselspec->chunks[c]->req, UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, err))) {
						/* a new subchunk: nodes rejected for a previous one may fit this one */
						for (int k = 0; dninfo_arr[k] != NULL; k++)
							dninfo_arr[k]->nscr &= ~NSCR_VISITED;
						/* place copies of this subchunk until one fails or none remain */
						while (rc && dselspec->chunks[c]->num_chunks > 0) {
							std::vector<nspec *> ns_chunk;
							rc = eval_simple_selspec(policy, spec->chunks[c], dninfo_arr, pl,
										 resresv, flags, ns_chunk, err);

							if (rc) {
								any_succ_rc = true;
								tot++;
								dselspec->chunks[c]->num_chunks--;

								/* mark every vnode just used so it is skipped from now on */
								for (const auto &ns : ns_chunk) {
									auto vn = find_node_by_rank(dninfo_arr, ns->ninfo->rank);
									if (vn != NULL)
										vn->nscr |= NSCR_SCATTERED;
								}
								nsa.insert(nsa.end(), ns_chunk.begin(), ns_chunk.end());
							} else {
								free_nspecs(ns_chunk);
								if (failerr->status_code == SCHD_UNKWN)
									move_schd_error(failerr, err);
								clear_schd_error(err);
							}
						}
					} else {
						/* the host as a whole can't hold this subchunk */
						char reason[MAX_LOG_SIZE] = {0};

						if (hostsets[i]->free_nodes == 0)
							strcpy(reason, "No free nodes available");
						else
							translate_fail_code(err, NULL, reason);

						log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG,
							   resresv->name, "Insufficient host-level resources %s", reason);

						/* don't be so specific in the comment since it's only for a single host */
						set_schd_error_arg(err, ARG1, NULL);

						if (failerr->status_code == SCHD_UNKWN)
							move_schd_error(failerr, err);
						clear_schd_error(err);
					}
				}
			}
			/* Scatter By Host Placement:
			 * place at most one chunk on any one host.  We make a call to
			 * eval_simple_selspec() for each sub-chunk (things between the +'s).
			 * If it returns success (i.e. rc=1) we are done for this host
			 */
			else if (pl->scatter) {
				/* rc == 0 in the condition stops at the first subchunk placed on this host */
				for (int c = 0; dselspec->chunks[c] != NULL && rc == 0; c++) {
					if ((hostsets[i]->free_nodes > 0) && (check_avail_resources(hostsets[i]->res,
												    dselspec->chunks[c]->req, UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, err))) {
						std::vector<nspec *> ns_chunk;

						/* skip subchunks which have already been fully placed on other hosts */
						if (dselspec->chunks[c]->num_chunks > 0) {
							for (int k = 0; dninfo_arr[k] != NULL; k++)
								dninfo_arr[k]->nscr &= ~NSCR_VISITED;

							rc = eval_simple_selspec(policy, spec->chunks[c],
										 dninfo_arr, pl, resresv, flags | EVAL_OKBREAK,
										 ns_chunk, err);

							if (rc) {
								any_succ_rc = 1;
								tot++;
								dselspec->chunks[c]->num_chunks--;
								nsa.insert(nsa.end(), ns_chunk.begin(), ns_chunk.end());
							} else {
								free_nspecs(ns_chunk);

								if (failerr->status_code == SCHD_UNKWN)
									move_schd_error(failerr, err);
								clear_schd_error(err);
							}
						}
					} else {
						/* the host as a whole can't hold this subchunk */
						char reason[MAX_LOG_SIZE] = {0};

						if (hostsets[i]->free_nodes == 0)
							strcpy(reason, "No free nodes available");
						else
							translate_fail_code(err, NULL, reason);

						log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG,
							   resresv->name, "Insufficient host-level resources %s", reason);

						/* don't be so specific in the comment since it's only for a single host */
						set_schd_error_arg(err, ARG1, NULL);

						if (failerr->status_code == SCHD_UNKWN)
							move_schd_error(failerr, err);
						clear_schd_error(err);
					}
				}
			}
			/* Free Placement:
			 * Place as many chunks as possible on vnodes as they can hold.
			 * We do this by duplicating both the nodes and the select spec.  The
			 * resources and chunks counts are decremented in the duplicated select
			 * when they are allocated.  The assigned resources on the nodes are
			 * increased when resources are allocated.  When the select spec has no
			 * more resources left, we've successfully fulfilled the request.  If we
			 * run out of nodes to search, then we've failed to fulfill the request.
			 */
			else if (pl->free) {
				node_info **dup_ninfo_arr;
				dup_ninfo_arr = dup_nodes(hostsets[i]->ninfo_arr,
							  resresv->server, NO_FLAGS);
				if (dup_ninfo_arr == NULL) {
					delete dselspec;
					return 0;
				}

				for (int c = 0; dselspec->chunks[c] != NULL; c++) {
					if ((hostsets[i]->free_nodes > 0) && (check_avail_resources(hostsets[i]->res,
												    dselspec->chunks[c]->req, UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, err))) {
						if (dselspec->chunks[c]->num_chunks > 0) {
							for (int k = 0; dup_ninfo_arr[k] != NULL; k++)
								dup_ninfo_arr[k]->nscr &= ~NSCR_VISITED;
							do {
								std::vector<nspec *> ns_chunk;
								rc = eval_simple_selspec(policy, dselspec->chunks[c], dup_ninfo_arr,
											 pl, resresv, flags | EVAL_OKBREAK, ns_chunk, err);

								if (rc) {
									any_succ_rc = true;
									tot++;
									dselspec->chunks[c]->num_chunks--;

									for (const auto &ns : ns_chunk) {
										/* charge the consumable resources to the duplicated
										 * node so the next chunk sees what is left on it
										 */
										req = ns->resreq;
										while (req != NULL) {
											if (req->type.is_consumable) {
												res = find_resource(ns->ninfo->res, req->def);
												if (res != NULL) {
													/* an indirect resource is accounted where it really lives */
													if (res->indirect_res != NULL)
														res = res->indirect_res;

													res->assigned += req->amount;
												}
											}
											req = req->next;
										}
										/* the solution must point at the node from the searched array, not the duplicate */
										ns->ninfo = find_node_by_indrank(nptr, ns->ninfo->node_ind, ns->ninfo->rank);
									}
									nsa.insert(nsa.end(), ns_chunk.begin(), ns_chunk.end());
								} else {
									free_nspecs(ns_chunk);

									if (failerr->status_code == SCHD_UNKWN)
										move_schd_error(failerr, err);
									clear_schd_error(err);
								}
							} while (rc && dselspec->chunks[c]->num_chunks > 0);
						}
					} else {
						/* the host as a whole can't hold this subchunk */
						char reason[MAX_LOG_SIZE] = {0};

						if (hostsets[i]->free_nodes == 0)
							strcpy(reason, "No free nodes available");
						else
							translate_fail_code(err, NULL, reason);

						log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG,
							   resresv->name, "Insufficient host-level resources %s", reason);
#ifdef NAS /* localmod 998 */
						set_schd_error_codes(err, NOT_RUN, RESOURCES_INSUFFICIENT);
						set_schd_error_arg(err, ARG1, "Host");
						set_schd_error_arg(err, ARG2, hostsets[i]->name);
#endif /* localmod 998 */
						/* don't be so specific in the comment since it's only for a single host */
						set_schd_error_arg(err, ARG1, NULL);

						if (failerr->status_code == SCHD_UNKWN)
							move_schd_error(failerr, err);
						clear_schd_error(err);
					}
				}
				free_nodes(dup_ninfo_arr);
			} else {
				log_eventf(PBSEVENT_DEBUG, PBS_EVENTCLASS_NODE, LOG_DEBUG, resresv->name,
					   "Unexpected Placement: not %s, %s, %s, or %s",
					   PLACE_Scatter, PLACE_VScatter, PLACE_Pack, PLACE_Free);
			}
			/* this host contributed to the solution: hand its nspecs to the caller */
			if (any_succ_rc) {
				if (do_exclhost) {
					/* If we're in a placement set dninfo_arr might not contain the whole hostset set.
					 * We need to grab the hostset from the node
					 */
					if (dninfo_arr[0]->hostset != NULL)
						alloc_rest_nodepart(nsa, dninfo_arr[0]->hostset->ninfo_arr);
					else
						alloc_rest_nodepart(nsa, dninfo_arr);
				}
				nspec_arr.insert(nspec_arr.end(), nsa.begin(), nsa.end());
			}
		}
	} else
		set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);

	if (dselspec != NULL)
		delete dselspec;

	if (tot == spec->total_chunks)
		return true;

	/* report the first failure we remembered if err doesn't already carry one */
	if (err->status_code == SCHD_UNKWN && failerr->status_code != SCHD_UNKWN)
		move_schd_error(err, failerr);

	return false;
}

/**
 * @brief
 * 		handle a complex (plus'd) select spec
 *
 * 		A spec with a single chunk is passed straight on to
 * 		eval_simple_selspec().  Otherwise every chunk of the spec is
 * 		evaluated in order with one pass over the nodes.  For scatter and
 * 		vscatter the caller's nodes are searched directly and the nodes used
 * 		are marked NSCR_SCATTERED.  For any other placement the nodes are
 * 		duplicated and the requested amounts are added to the duplicates'
 * 		assigned resources so later chunks see what earlier ones took.
 *
 * 		If the solution uses more than one node and at least one of them
 * 		has no_multinode_jobs set, the solution is thrown away,
 * 		resresv->will_use_multinode is set and the spec is evaluated again.
 *
 * @param[in]	policy	-	policy info
 * @param[in]	spec	-	the select spec
 * @param[in]	ninfo_arr	-	array of nodes to satisfy the spec
 * @param[in]	pl	-	parsed placement spec
 * @param[in]	resresv	-	the resource resv the spec is from
 * @param[in]	flags	-	flags to change functions behavior
 *	      					EVAL_OKBREAK - ok to break chunk up across vnodes
 *	      					EVAL_EXCLSET - allocate entire nodelist exclusively
 * @param[out]	nspec_arr	-	the node solution
 * @param[out]	err	-	error structure to return error information
 *
 * @retval	true	: if the selspec can be satisfied
 * @retval	false	: if not, or if spec, ninfo_arr, pl or resresv is NULL
 *
 */
bool
eval_complex_selspec(status *policy, selspec *spec, node_info **ninfo_arr, place *pl,
		     resource_resv *resresv, unsigned int flags, std::vector<nspec *> &nspec_arr, schd_error *err)
{
	std::vector<nspec *> nsa; /* the nspec array to hold node solution */
	node_info **nodes;	  /* nodes to search through (possibly duplicated) */
	int rc = 1;		  /* used as a return code in the complex spec case */
	int tot_nodes;		  /* total number of nodes on the server */
	int num_nodes_used = 0;	  /* number of nodes used to satisfy spec */

	/* number of nodes used with the no_multinode_job flag set */
	int num_no_multi_nodes = 0;

	int chunks_needed = 0;

	int k;
	int n;
	int c;
	resource_req *req;
	schd_resource *res;

	/* pl and resresv are dereferenced below for multi-chunk specs, and
	 * eval_simple_selspec() rejects them for single chunk specs anyway
	 */
	if (spec == NULL || ninfo_arr == NULL || pl == NULL || resresv == NULL)
		return false;

	/* we have a simple selspec... just pass it along */
	if (spec->total_chunks == 1)
		return eval_simple_selspec(policy, spec->chunks[0], ninfo_arr,
					   pl, resresv, flags, nspec_arr, err);

	tot_nodes = count_array(ninfo_arr);

	/* we have a complex select spec
	 * This makes things more complicated now... we can make a single pass
	 * through our nodes and will possibly come up with a solution... but
	 * there is always the chance we could swap out nodes depending on one
	 * node being able to satisfy multiple simple specs.
	 * This recursion could take very long to finish.
	 *
	 * We'll go through the nodes once since it'll probably be fine for most
	 * cases.
	 */

	if (pl->scatter || pl->vscatter) {
		/* scattering only needs the scratch flags, so work on the real nodes */
		nodes = ninfo_arr;
		for (k = 0; nodes[k] != 0; k++)
			nodes[k]->nscr &= ~NSCR_SCATTERED;
	} else {
		/* resources get charged to the nodes as we go, so work on a copy */
		if ((nodes = dup_nodes(ninfo_arr, resresv->server, NO_FLAGS)) == NULL)
			return false;
	}

	/* c counts individual chunks, n indexes the subchunk (things between the
	 * +'s) they belong to, chunks_needed is what is left of subchunk n
	 */
	n = -1;
	for (c = 0, chunks_needed = 0; c < spec->total_chunks && rc > 0; c++) {
		std::vector<nspec *> ns_chunk;
		if (chunks_needed == 0) {
			/* move on to the next subchunk; nodes rejected for the
			 * previous one get another chance
			 */
			n++;
			chunks_needed = spec->chunks[n]->num_chunks;
			for (k = 0; nodes[k] != 0; k++)
				nodes[k]->nscr &= ~NSCR_VISITED;
		}

		rc = eval_simple_selspec(policy, spec->chunks[n], nodes, pl, resresv, flags, ns_chunk, err);

		if (rc) {
			for (auto &ns : ns_chunk) {
				num_nodes_used++;
				if (ns->ninfo->no_multinode_jobs)
					num_no_multi_nodes++;

				if (pl->scatter || pl->vscatter)
					ns->ninfo->nscr |= NSCR_SCATTERED;
				else {
					/* charge what this nspec takes to the duplicated node */
					req = ns->resreq;
					while (req != NULL) {
						res = find_resource(ns->ninfo->res, req->def);
						if (res != NULL)
							res->assigned += req->amount;

						req = req->next;
					}
					/* replace the dup'd node with the real one */
					ns->ninfo = find_node_by_indrank(ninfo_arr, ns->ninfo->node_ind, ns->ninfo->rank);
				}

				/* if policy is avoid provision, continue to use aoe-sorted list
				 * of nodes.
				 */
				if (conf.provision_policy != AVOID_PROVISION &&
				    !cstat.node_sort->empty() && conf.node_sort_unused)
					qsort(nodes, tot_nodes, sizeof(node_info *), multi_node_sort);
			}
			chunks_needed--;
			nsa.insert(nsa.end(), ns_chunk.begin(), ns_chunk.end());
		}
	}

	if (rc) {
		/* ownership of the nspecs moves to the caller's vector */
		nspec_arr.insert(nspec_arr.end(), nsa.begin(), nsa.end());
		nsa.clear();
	} else
		free_nspecs(nsa);

	/* only free the node array if we duplicated it above */
	if (!(pl->scatter || pl->vscatter))
		free_nodes(nodes);

	if (num_no_multi_nodes == 0 ||
	    (num_no_multi_nodes == 1 && num_nodes_used == 1))
		return rc;

	/* if we've reached this point we're a multi node job and have selected
	 * a node which requested to not be used for multi-node jobs.  We'll
	 * mark the job as a job which will use multiple nodes and use tail
	 * recursion to resatisfy the job without the nodes which are marked
	 * as no multi-node jobs
	 */
	resresv->will_use_multinode = 1;
	log_event(PBSEVENT_DEBUG2, PBS_EVENTCLASS_JOB, LOG_DEBUG, resresv->name,
		  "Used multiple nodes with no_multinode_job=true: Resatisfy");

	if (!nspec_arr.empty())
		free_nspecs(nspec_arr);

	return eval_complex_selspec(policy, spec, ninfo_arr, pl, resresv, flags, nspec_arr, err);
}

/**
 * @brief
 * 		eval a non-plused select spec for satisfiability
 *
 * 		Walks the nodes in order, skipping any whose scratch flags (nscr)
 * 		are set, until one chunk has been placed.  Without EVAL_OKBREAK the
 * 		chunk has to fit on a single vnode.  With EVAL_OKBREAK the nodes
 * 		are duplicated and the consumable part of the chunk may be spread
 * 		over several vnodes, producing one nspec per vnode used.
 *
 * @param[in]	policy	-	policy info
 * @param[in]	chk	-	the chunk to satisfy
 * @param[in]	pninfo_arr	-	the array of nodes
 * @param[in]	pl	-	placement information (from -l place)
 * @param[in]	resresv	-	the job the spec is from - needed for resvs
 * @param[in]	flags	-	flags to change functions behavior
 *	      					EVAL_OKBREAK - ok to break chunk up across vnodes
 *	      					EVAL_EXCLSET - allocate entire nodelist exclusively
 * @param[out]	nspec_arr	-	the node solution; only appended to on success
 * @param[out]	err	-	error structure to return error information.
 *							Cleared on success.
 *
 * @return	bool
 * @retval	true	: if the select spec is satisfiable
 * @retval	false	: if not
 *
 */
bool
eval_simple_selspec(status *policy, chunk *chk, node_info **pninfo_arr,
		    place *pl, resource_resv *resresv, unsigned int flags,
		    std::vector<nspec *> &nspec_arr, schd_error *err)
{
	int chunks_found = 0;		      /* number of nodes found to satisfy a subspec */
	resource_req *specreq_noncons = NULL; /* non-consumable resources requested by spec */
	resource_req *specreq_cons = NULL;    /* consumable resources requested by spec */
	resource_req *req = NULL;	      /* used to determine if we're done */
	resource_req *prevreq = NULL;	      /* used to determine if we're done */
	resource_req *tmpreq = NULL;	      /* used to unlink and free */
	bool need_new_nspec = false;	      /* need to allocate a new nspec for node solution */

	bool allocated = false; /* did we allocate resources to a vnode */
	int i = 0;
	int k = 0;

	char *str_chunk = NULL; /* ptr to after the number of chunks in the str_chunk */

	node_info **ninfo_arr = NULL;

	/* remembers the first failure seen; allocated once and reused across calls */
	static schd_error *failerr = NULL;

	resource_req *aoereq = NULL;
	nspec *ns = NULL; /* scratch nspec; owned by nsa only once it has been pushed there */

	std::vector<nspec *> nsa;

	if (chk == NULL || pninfo_arr == NULL || resresv == NULL || pl == NULL)
		return false;

	if (failerr == NULL) {
		failerr = new_schd_error();
		if (failerr == NULL) {
			set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);
			return false;
		}
	}

	/* if it's OK to break across vnodes, but we can fully fit on one
	 * vnode, then lets do that rather then possibly breaking across multiple
	 */
	if ((flags & EVAL_OKBREAK) &&
	    can_fit_on_vnode(chk->req, pninfo_arr)) {
		flags &= ~EVAL_OKBREAK;
	}

	/* we need to dup the nodes to handle indirect resources which need to be
	 * accounted for between nodes allocated to the job.  The only time we
	 * need to account for this is when we're breaking a chunk across
	 * vnodes.  Otherwise the entire chunk is going onto 1 vnode.
	 */
	if (flags & EVAL_OKBREAK) {
		ninfo_arr = dup_nodes(pninfo_arr, resresv->server, NO_FLAGS);
		if (ninfo_arr == NULL) {
			set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);
			return false;
		}
	} else
		ninfo_arr = pninfo_arr;

	/* find the requested resources part of a chunk, not the number requested.
	 * isdigit() must not be handed a negative value, hence the cast.
	 */
	for (i = 0; isdigit((unsigned char) chk->str_chunk[i]); i++)
		;

	if (chk->str_chunk[i] == ':')
		i++;

	str_chunk = &chk->str_chunk[i];

	log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
		   resresv->name, "Evaluating subchunk: %s", str_chunk);

	/* We're duplicating the entire list here.  This list is organized so that
	 * all non-consumable resources come before the consumable ones.  After
	 * duplicating, we split it into the consumable and non-consumable lists.
	 */
	specreq_noncons = dup_resource_req_list(chk->req);
	clear_schd_error(failerr);

	if (specreq_noncons == NULL) {
		set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);

		if (flags & EVAL_OKBREAK)
			free_nodes(ninfo_arr);
		return false;
	}

	if (resresv->aoename != NULL) {
		resresv->is_prov_needed = 1;
		aoereq = find_resource_req(specreq_noncons, allres["aoe"]);
		/* Provisionable node needed only if placement=pack or
		 * subchunk consists aoe resource request.
		 */
		if (!pl->pack && aoereq == NULL)
			resresv->is_prov_needed = 0;
	}

	/* find the first consumable resource; prevreq ends up on the last non-consumable one */
	for (req = specreq_noncons; req != NULL && req->type.is_non_consumable;
	     prevreq = req, req = req->next)
		;

	/* cut the list in two at that point */
	specreq_cons = req;
	if (prevreq != NULL)
		prevreq->next = NULL;
	else
		specreq_noncons = NULL; /* no non-consumable resources */

	ns = new nspec();

	for (i = 0; ninfo_arr[i] != NULL && chunks_found == 0; i++) {
		/* any scratch flag (visited, scattered, ...) takes the node out of the search */
		if (ninfo_arr[i]->nscr)
			continue;

		allocated = false;
		clear_schd_error(err);
		if (ninfo_arr[i]->lic_lock) {

			/* the previous nspec went into the solution, start a fresh one */
			if (need_new_nspec) {
				need_new_nspec = false;
				ns = new nspec();
			}

			if (is_vnode_eligible_chunk(specreq_noncons, ninfo_arr[i], resresv, err)) {
				if (specreq_cons != NULL)
					allocated = resources_avail_on_vnode(specreq_cons, ninfo_arr[i],
									     pl, resresv, flags, ns, err);
				if (allocated) {
					nsa.push_back(ns);
					need_new_nspec = true;
					ns->seq_num = chk->seq_num;
					ns->sub_seq_num = get_sched_rank();

					if (flags & EVAL_OKBREAK) {
						/* search through requested consumable resources for resources we've
						 * completely allocated.  We'll unlink and free the resource_req
						 */
						prevreq = NULL;
						req = specreq_cons;
						while (req != NULL) {
							if (req->amount == 0) {
								tmpreq = req;
								if (prevreq == NULL)
									req = specreq_cons = req->next;
								else
									req = prevreq->next = req->next;

								free_resource_req(tmpreq);
							} else {
								prevreq = req;
								req = req->next;
							}
						}
						/* nothing left to allocate: the chunk is complete */
						if (specreq_cons == NULL) {
							chunks_found = 1;
							/* we found our solution, we don't need any more nspec's */
							need_new_nspec = false;
							ns->end_of_chunk = 1;
						}

						/* Replace the dup'd node with the real one, but only if we dup'd the nodes */
						if (pninfo_arr != ninfo_arr) {
							/* Need to call find_node_by_rank() over indrank since eval_placement might dup the nodes */
							ns->ninfo = find_node_by_rank(pninfo_arr, ns->ninfo->rank);
						}
					} else {
						chunks_found = 1;
						/* we found our solution, we don't need any more nspec's */
						need_new_nspec = false;
						ns->end_of_chunk = 1;
					}
				} else {
					ninfo_arr[i]->nscr |= NSCR_VISITED;
					if (failerr->status_code == SCHD_UNKWN)
						copy_schd_error(failerr, err);
				}
			} else {
				ninfo_arr[i]->nscr |= NSCR_VISITED;
				if (failerr->status_code == SCHD_UNKWN)
					copy_schd_error(failerr, err);
			}

		} else
			set_schd_error_codes(err, NOT_RUN, NODE_UNLICENSED);

		if (err->error_code != SUCCESS) {
			schdlogerr(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
				   ninfo_arr[i]->name, NULL, err);
			/* Since this node is not eligible, check if it ever eligible
			 * If it is never eligible, mark all nodes like it visited.
			 * If we can break, don't bother with equivalence classes
			 * because the chunk is pretty much equivalent to ncpus=1 at that point
			 */
			if (ninfo_arr[i]->nodesig_ind >= 0 && !(flags & EVAL_OKBREAK)) {
				if (check_avail_resources(ninfo_arr[i]->res, chk->req,
							  COMPARE_TOTAL | UNSET_RES_ZERO | CHECK_ALL_BOOLS,
							  policy->resdef_to_check_no_hostvnode,
							  INSUFFICIENT_RESOURCE, err) == 0) {
					log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
						   "", "Marking nodes with signature %s ineligible", ninfo_arr[i]->nodesig);
					for (k = 0; ninfo_arr[k] != NULL; k++) {
						if (ninfo_arr[k]->nodesig_ind == ninfo_arr[i]->nodesig_ind) {
							ninfo_arr[k]->nscr |= NSCR_VISITED;
							if (i != k)
								schdlogerr(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
									   ninfo_arr[k]->name, NULL, err);
						}
					}
				}
			}

		} else {
			log_event(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
				  ninfo_arr[i]->name, "Node allocated to job");
		}
	}

	if (specreq_cons != NULL)
		free_resource_req_list(specreq_cons);
	if (specreq_noncons != NULL)
		free_resource_req_list(specreq_noncons);

	if (flags & EVAL_OKBREAK)
		free_nodes(ninfo_arr);

	if (chunks_found) {
		nspec_arr.insert(nspec_arr.end(), nsa.begin(), nsa.end());
		log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG,
			   resresv->name, "Allocated one subchunk: %s", str_chunk);
		clear_schd_error(err);
		return true;
	}

	/* If we didn't allocate any nodes, we need to clean up any nspecs
	 * we've allocated.  This is either the one we allocated in the front of
	 * the main loop above, or for all the nodes we allocated and need to
	 * "deallocate" due to a reason we've decided we can't allocate like exclhost
	 *
	 * The scratch nspec only belongs to nsa once it has been pushed there.
	 * need_new_nspec is false here exactly when the current one never was,
	 * so it has to be released separately or it would be leaked.
	 */
	if (!need_new_nspec)
		delete ns;
	free_nspecs(nsa);
	nsa.clear();

	log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG, resresv->name,
		   "Failed to satisfy subchunk: %s", chk->str_chunk);

	/* If the last node we looked at was fine, err would be empty.
	 * Actually return a real error */
	if (err->status_code == SCHD_UNKWN && failerr->status_code != SCHD_UNKWN)
		move_schd_error(err, failerr);
	/* don't be so specific in the comment since it's only for a single node */
	set_schd_error_arg(err, ARG1, NULL);
	return false;
}

/**
 * @brief
 * 		check whether a node may be used by a job or reservation,
 *		looking only at the node itself and not at the resources
 *		of any chunk
 *
 * @param[in]	node	-	the node to evaluate
 * @param[in]	resresv	-	resource resv which is requesting
 * @param[in]	pl	-	place spec for request
 * @param[out]	err	-	error status if node is ineligible
 *
 * @par NOTE:
 * 		the checks are made in a fixed order and the first one
 *		to fail decides what is reported in err.  Nothing is
 *		written to err if one of the arguments is NULL.
 *
 * @return	bool
 * @retval	true	: if node is eligible to run the request
 * @retval	false	: if node is ineligible or an argument is NULL
 *
 */
bool
is_vnode_eligible(node_info *node, resource_resv *resresv,
		  struct place *pl, schd_error *err)
{
	if (node == NULL || resresv == NULL || pl == NULL || err == NULL)
		return false;

	/* is the request a job which lives inside of a reservation? */
	const bool job_in_resv = resresv->job != NULL && resresv->job->resv != NULL;

	/* the reservation's name starting with 'M' marks a maintenance reservation */
	const bool maint_resv = job_in_resv && resresv->job->resv->name[0] == 'M';

	/* A node is invalid for an exclusive job if jobs/resvs are running on it
	 * except if the job is a maintenance reservation
	 * NOTE: this check must be the first check or exclhost may break
	 */
	if (!maint_resv && is_excl(pl, node->sharing)) {
		const bool node_busy = node->num_jobs > 0 || node->num_run_resv > 0;

		if (node_busy) {
			set_schd_error_codes(err, NOT_RUN, NODE_NOT_EXCL);
			set_schd_error_arg(err, ARG1, resresv->is_job ? "Job" : "Reservation");
			return false;
		}
	}

	/* an EOE was requested: the node has to offer it */
	if (resresv->eoename != NULL && !is_eoe_avail_on_vnode(node, resresv)) {
		set_schd_error_codes(err, NOT_RUN, EOE_NOT_AVALBL);
		set_schd_error_arg(err, ARG1, resresv->eoename);
		return false;
	}

	if (!node->is_free) {
		set_schd_error_codes(err, NOT_RUN, INVALID_NODE_STATE);
		set_schd_error_arg(err, ARG1, (char *) node_state_to_str(node));
#ifdef NAS /* localmod 031 */
		set_schd_error_arg(err, ARG2, node->name);
#endif /* localmod 031 */
		return false;
	}

	/*
	 * Inside the reservation's universe the node may look fine while its
	 * counterpart in the server's universe is being provisioned, so the
	 * server's view of the node is consulted as well.
	 */
	if (job_in_resv && node->svr_node != NULL && node->svr_node->is_provisioning) {
		set_schd_error_codes(err, NOT_RUN, INVALID_NODE_STATE);
#ifdef NAS /* localmod 031 */
		set_schd_error_arg(err, ARG1, node->name);
		set_schd_error_arg(err, ARG2, node_state_to_str(node->svr_node));
#else
		set_schd_error_arg(err, ARG1, (char *) node_state_to_str(node->svr_node));
#endif /* localmod 031 */
		return false;
	}

	if (resresv->is_resv && !node->resv_enable) {
		set_schd_error_codes(err, NOT_RUN, NODE_RESV_ENABLE);
		return false;
	}

	/* per node run limits apply to jobs only, and not while a job is being qrun */
	if (resresv->is_job && resresv->server->qrun_job == NULL) {
		if (node->max_running != SCHD_INFINITY) {
			if (node->num_jobs >= node->max_running) {
				set_schd_error_codes(err, NOT_RUN, NODE_JOB_LIMIT_REACHED);
				return false;
			}
		}

		if (node->max_user_run != SCHD_INFINITY) {
			if (find_counts_elm(node->user_counts, resresv->user, NULL, NULL, NULL) >= node->max_user_run) {
				set_schd_error_codes(err, NOT_RUN, NODE_USER_LIMIT_REACHED);
				return false;
			}
		}

		if (node->max_group_run != SCHD_INFINITY) {
			if (find_counts_elm(node->group_counts, resresv->group, NULL, NULL, NULL) >= node->max_group_run) {
				set_schd_error_codes(err, NOT_RUN, NODE_GROUP_LIMIT_REACHED);
				return false;
			}
		}
	}

	/* multiple nodes jobs/resvs not allowed on this node */
	if (node->no_multinode_jobs && resresv->will_use_multinode) {
		set_schd_error_codes(err, NOT_RUN, NODE_NO_MULT_JOBS);
		return false;
	}

	return true;
}
/**
 * @brief
 * 		check if a vnode is eligible for a chunk
 *
 * @param[in]	specreq	-	resources from chunk (may be NULL: no resource check is done)
 * @param[in]	node	-	vnode to check
 * @param[in]	resresv	-	the requesting job/resv (may be NULL: the multinode
 *				check is skipped)
 * @param[out]	err	-	error structure
 *
 * @return	bool
 * @retval	true	: eligible
 * @retval	false	: not eligible
 */
bool
is_vnode_eligible_chunk(resource_req *specreq, node_info *node,
			resource_resv *resresv, schd_error *err)
{
	/* multiple nodes jobs/resvs not allowed on this node */
	if (resresv != NULL && node->no_multinode_jobs && resresv->will_use_multinode) {
		set_schd_error_codes(err, NOT_RUN, NODE_NO_MULT_JOBS);
		return false;
	}

	/* without chunk resources there is nothing left to compare */
	if (specreq == NULL)
		return true;

	/* a zero result from check_avail_resources() means the node can not
	 * satisfy the chunk
	 */
	auto matched = check_avail_resources(node->res, specreq,
					     CHECK_ALL_BOOLS | ONLY_COMP_NONCONS | UNSET_RES_ZERO,
					     INSUFFICIENT_RESOURCE, err);
	return matched != 0;
}

/**
 * @brief
 *	Decide whether a job's requested EOE can be honored on a vnode.
 *  Based on is_provisionable.
 *
 * @par Functionality:
 *	Requests that are not jobs, or that carry no eoename, need nothing.
 *	Otherwise the vnode is usable for power operations only when all of
 *	the following hold:-
 *	(1) Server has power_provisioning True,
 *	(2) Vnode has power_provisioning True,
 *	(3) If the vnode's current_eoe is unset or differs from the job's
 *	    eoename, the vnode has no running or suspended jobs,
 *	(4) No reservation in the vnode's run_resvs_arr is without an eoename
 *
 * @param[in]		node	-	pointer to node_info
 * @param[in]		resresv	-	pointer to resource_resv
 * @param[in,out]	err		-	pointer to schd_error; error_code is
 *						set when NOT_PROVISIONABLE is returned
 *
 * @return	int
 * @retval	 NO_PROVISIONING_NEEDED : resresv doesn't request eoe,
 *			resresv is not a job, or the vnode's current_eoe already
 *			matches the job eoe
 * @retval	 PROVISIONING_NEEDED : vnode doesn't have current_eoe set
 *          or it doesn't match job eoe
 * @retval	 NOT_PROVISIONABLE  : vnode is not provisionable
 *			(see err for more details)
 *
 * @par MT-safe: No
 *
 */
int
is_powerok(node_info *node, resource_resv *resresv, schd_error *err)
{
	/* only jobs which request an eoe are of interest */
	if (!resresv->is_job || resresv->eoename == NULL)
		return NO_PROVISIONING_NEEDED;

	if (!resresv->server->power_provisioning) {
		err->error_code = PROV_DISABLE_ON_SERVER;
		return NOT_PROVISIONABLE;
	}

	if (!node->power_provisioning) {
		err->error_code = PROV_DISABLE_ON_NODE;
		return NOT_PROVISIONABLE;
	}

	/* does the node already carry the eoe the job asks for? */
	const bool eoe_matches = node->current_eoe != NULL &&
				 strcmp(resresv->eoename, node->current_eoe) == 0;

	/* switching the eoe is only possible when there are no jobs on the node */
	if (!eoe_matches && (node->num_jobs > 0 || node->num_susp_jobs > 0)) {
		err->error_code = PROV_RESRESV_CONFLICT;
		return NOT_PROVISIONABLE;
	}

	/* node cannot be shared between running reservation without EOE
	 * and job with EOE
	 */
	if (node->run_resvs_arr) {
		int idx = 0;
		while (node->run_resvs_arr[idx] != NULL) {
			if (node->run_resvs_arr[idx]->eoename == NULL) {
				err->error_code = PROV_RESRESV_CONFLICT;
				return NOT_PROVISIONABLE;
			}
			idx++;
		}
	}

	return eoe_matches ? NO_PROVISIONING_NEEDED : PROVISIONING_NEEDED;
}

/**
 * @brief
 * 		check to see if there are enough
 *		consumable resources on a vnode to make it
 *		eligible for a request
 *		Note: This function will allocate <= 1 chunk
 *
 * @param[in,out] specreq_cons - IN : requested consumable resources
 *				  OUT: requested - allocated resources
 *				       (amounts are only reduced when
 *				       EVAL_OKBREAK is set)
 * @param[in]	node	-	the node to evaluate
 * @param[in]	pl	-	place spec for request
 * @param[in]	resresv	-	resource resv which is requesting
 * @param[in]	flags	-	flags to change behavior of function
 *              			EVAL_OKBREAK - OK to break chunk across vnodes
 * @param[in,out]	ns	-	optional (may be NULL) nspec which records the
 *					allocation: ninfo, resreq and go_provision
 *					are filled in
 * @param[out]	err	-	error status if node is ineligible
 *
 *	@retval	true	: if resources were allocated from the node
 *	@retval false	: if sufficient resources are not available (err is set),
 *			  or if a required argument is NULL
 */
bool
resources_avail_on_vnode(resource_req *specreq_cons, node_info *node,
			 place *pl, resource_resv *resresv, unsigned int flags,
			 nspec *ns, schd_error *err)
{
	/* used for allocating partial chunks */
	resource_req tmpreq = {0};
	resource_req *req;
	resource_req *newreq, *aoereq;
	long long num_chunks = 0;
	int is_p;

	if (specreq_cons == NULL || node == NULL ||
	    resresv == NULL || pl == NULL || err == NULL)
		return false;

	if (flags & EVAL_OKBREAK) {
		/* The chunk may be split across vnodes: every consumable resource is
		 * looked at on its own and as much as this node can give is taken.
		 */
		bool allocated = false;

		/* req is the first consumable resource at this point */
		for (req = specreq_cons; req != NULL; req = req->next) {
			if (req->type.is_consumable) {
				/* amount still outstanding for this resource */
				auto num = req->amount;
				/* probe with a request for a single unit of this one resource */
				tmpreq.amount = 1;

				tmpreq.name = req->name;
				tmpreq.type = req->type;
				tmpreq.res_str = req->res_str;
				tmpreq.def = req->def;
				tmpreq.next = NULL;
				num_chunks = check_resources_for_node(&tmpreq, node, resresv, err);

				if (num_chunks > 0) {
					is_p = is_provisionable(node, resresv, err);
					if (is_p == NOT_PROVISIONABLE) {
						/* NOTE(review): resources taken by earlier iterations of
						 * this loop (req->amount, assigned, ns->resreq) are not
						 * rolled back here - confirm callers discard them.
						 */
						allocated = false;
						break;
					} else if (is_p == PROVISIONING_NEEDED) {
						if (ns != NULL)
							ns->go_provision = 1;
						/* Do not set current aoe/eoe on the node when placement is scatter/vscatter
						 * because in case of scatter/vscatter placement we are not working on duplicate
						 * copy of nodes.
						 */
						if (resresv->select->total_chunks > 1 && pl->scatter != 1 && pl->vscatter != 1)
							set_current_aoe(node, resresv->aoename);
						if (resresv->is_job) {
							log_eventf(PBSEVENT_DEBUG2, PBS_EVENTCLASS_JOB, LOG_NOTICE, resresv->name,
								   "Vnode %s selected for provisioning with AOE %s", node->name.c_str(), resresv->aoename);
						}
					}

					/* check if power eoe needs to be considered */
					is_p = is_powerok(node, resresv, err);
					if (is_p == NOT_PROVISIONABLE) {
						allocated = false;
						break;
					} else if (is_p == PROVISIONING_NEEDED) {
						if (resresv->select->total_chunks > 1 && pl->scatter != 1 && pl->vscatter != 1)
							set_current_eoe(node, resresv->eoename);

						if (resresv->is_job)
							log_eventf(PBSEVENT_DEBUG2, PBS_EVENTCLASS_JOB, LOG_NOTICE, resresv->name,
								   "Vnode %s selected for power with EOE %s", node->name.c_str(), resresv->eoename);
					}

					/* never take more than what is still requested */
					if (num_chunks > num)
						num_chunks = num;

					if (ns != NULL) {
						/* record the amount taken from this node at the head of ns->resreq */
						newreq = dup_resource_req(req);
						if (newreq == NULL)
							return false;

						newreq->amount = num_chunks;

						if (ns->ninfo == NULL) /* check if this is the first res */
							ns->ninfo = node;

						newreq->next = ns->resreq;
						ns->resreq = newreq;
					}

					/* now that we have allocated some resources to this node, we need
					 * to remove them from the requested amount
					 */
					req->amount -= num_chunks;

					/* account for the allocation on the node; an indirect resource
					 * is charged on the resource it points to
					 */
					auto res = find_resource(node->res, req->def);
					if (res != NULL) {
						if (res->indirect_res != NULL)
							res->indirect_res->assigned += num_chunks;
						else
							res->assigned += num_chunks;
					}

					/* use tmpreq to wrap the amount so we can use res_to_str */
					tmpreq.amount = num_chunks;

					log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG, node->name,
						   "vnode allocated %s=%s", req->name, res_to_str(&tmpreq, RF_REQUEST));

					allocated = true;
				}
			}
		}
		if (allocated) {
			/* provisioning was requested: prepend an "aoe" request to ns->resreq */
			if (ns != NULL && ns->go_provision != 0) {
				aoereq = create_resource_req("aoe", resresv->aoename);
				if (aoereq != NULL) {
					aoereq->next = ns->resreq;
					ns->resreq = aoereq;
				}
			}

			/* num_chunks holds the value from the last consumable resource examined */
			if (pl->pack && num_chunks == 1 && cstat.smp_dist == SMP_ROUND_ROBIN)
				pbs_strncpy(last_node_name, node->name.c_str(), sizeof(last_node_name));
			return true;
		}
	} else {
		/* The chunk must fit on this node as a whole */
		num_chunks = check_resources_for_node(specreq_cons, node, resresv, err);
		if (num_chunks > 0) {
			is_p = is_provisionable(node, resresv, err);
			if (is_p == NOT_PROVISIONABLE)
				return false;

			else if (is_p == PROVISIONING_NEEDED) {
				if (ns != NULL)
					ns->go_provision = 1;
				if (resresv->select->total_chunks > 1 && pl->scatter != 1 && pl->vscatter != 1) {
					set_current_aoe(node, resresv->aoename);
				}
			}

			is_p = is_powerok(node, resresv, err);
			if (is_p == NOT_PROVISIONABLE)
				return false;
			else if (is_p == PROVISIONING_NEEDED) {
				if (resresv->select->total_chunks > 1 && pl->scatter != 1 && pl->vscatter != 1) {
					set_current_eoe(node, resresv->eoename);
				}
			}
		}

		/* if we have infinite amount of resources, the node has been allocated */
		if (num_chunks == SCHD_INFINITY)
			num_chunks = 1;

		if (ns != NULL && num_chunks != 0) {
			/* the whole chunk is satisfied by this node: hand back a copy of the request */
			ns->ninfo = node;
			ns->resreq = dup_resource_req_list(specreq_cons);

			if (ns->go_provision != 0) {
				aoereq = create_resource_req("aoe", resresv->aoename);
				if (aoereq != NULL) {
					aoereq->next = ns->resreq;
					ns->resreq = aoereq;
				}
			}

			if (pl->pack && cstat.smp_dist == SMP_ROUND_ROBIN)
				pbs_strncpy(last_node_name, node->name.c_str(), sizeof(last_node_name));
		}
		return num_chunks ? true : false;
	}

	/* EVAL_OKBREAK path fell through without allocating anything */
	return false;
}

/**
 * @brief
 * 		check to see how many chunks can fit on a
 *		node looking at both resources available
 *		now and future advanced reservations
 *
 * @param[in]	resreq	-	requested resources
 * @param[in]	ninfo   -	node to check for
 * @param[in]	resresv -	the resource resv to check for
 * @param[out]	err    -	schd_error reply if there aren't enough resources
 *
 * @par NOTE:
 * 		all resources in resreq will be honored regardless of
 *      whether they are in conf.res_to_check or not due to the fact
 *		that chunk resources only contain such resources.
 *
 * @retval
 * 		number of chunks which can be satisfied during the duration
 * @retval	0	: the request can not be satisfied (err is set)
 * @retval	-1	: on error (NULL argument or failure to duplicate the
 *			  node's resource list)
 */
long long
check_resources_for_node(resource_req *resreq, node_info *ninfo,
			 resource_resv *resresv, schd_error *err)
{
	if (resreq == NULL || ninfo == NULL || err == NULL || resresv == NULL)
		return -1;

	auto noderes = ninfo->res;

	/* the minimum number of chunks which can be satisfied for the duration
	 * of the request.  It starts out as what fits on the node right now and
	 * can only shrink while walking the calendar below.
	 */
	long long min_chunks = check_avail_resources(noderes, resreq,
						     CHECK_ALL_BOOLS | UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, err);

	auto calendar = ninfo->server->calendar;
	auto cur_time = ninfo->server->server_time;

	/* end of the window in which timed events can conflict with the request */
	time_t end_time;
	if (resresv->duration != resresv->hard_duration &&
	    exists_resv_event(calendar, cur_time + resresv->hard_duration))
		end_time = cur_time + calc_time_left(resresv, 1);
	else
		end_time = cur_time + calc_time_left(resresv, 0);

	/* check if there are any timed events to check for conflicts with. We do not
	 * need to check for timed conflicts if the current object is a job inside a
	 * reservation.
	 */
	if (min_chunks > 0 && exists_run_event(calendar, end_time) && !(resresv->job != NULL && resresv->job->resv != NULL)) {
		/* Check for possible conflicts with timed events by walking the sorted
		 * event list that was created in eval_selspec. This runs a simulation
		 * forward in time to account for timed events consuming and/or releasing
		 * resources.
		 *
		 * For example, if a resource_resv such as a reservation is consuming n cpus
		 * from t1 to t2, then the resources should be taken out at t1 and returned
		 * at t2.
		 */
		auto nres = dup_ind_resource_list(noderes);
		auto resresv_excl = is_excl(resresv->place_spec, ninfo->sharing);

		if (nres == NULL) {
			set_schd_error_codes(err, NOT_RUN, SCHD_ERROR);
			return -1;
		}

		/* Walk the event list by time such that the start of an event always
		 * precedes the end of it. The event type (start or end event) is
		 * determined, and the resources are consumed if a start event, and
		 * released if an end event.
		 */
		timed_event *event = get_next_event(calendar);
		const auto event_mask = TIMED_RUN_EVENT | TIMED_END_EVENT;

		for (event = find_init_timed_event(event, IGNORE_DISABLED_EVENTS, event_mask);
		     event != NULL && min_chunks > 0;
		     event = find_next_timed_event(event, IGNORE_DISABLED_EVENTS, event_mask)) {
			auto event_time = event->event_time;
			auto resc_resv = static_cast<resource_resv *>(event->event_ptr);
			nspec *ns;

			/* events in the past are of no interest */
			if (event_time < cur_time)
				continue;
			/* jobs inside reservations are skipped */
			if (resc_resv->job != NULL && resc_resv->job->resv != NULL)
				continue;

			if (!resc_resv->nspec_arr.empty())
				ns = find_nspec_by_rank(resc_resv->nspec_arr, ninfo->rank);
			else {
				ns = NULL;
				log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_SCHED, LOG_WARNING, resresv->name,
					   "Event %s is a run/end event w/o nspec array, ignoring event", event->name.c_str());
			}

			auto is_run_event = (event->event_type == TIMED_RUN_EVENT);

			/* only events inside our window, of other resresvs, which use this node matter */
			if ((event_time < end_time) && resresv != resc_resv && ns != NULL) {
				/* One event will need provisioning while the other will not,
				 * they cannot co exist at same time.
				 */
				if (resresv->aoename != NULL && resc_resv->aoename == NULL) {
					set_schd_error_codes(err, NOT_RUN, PROV_RESRESV_CONFLICT);
					min_chunks = 0;
					break;
				}

				if (is_excl(resc_resv->place_spec, ninfo->sharing) || resresv_excl) {
					/* either side wants the node exclusively: nothing fits */
					min_chunks = 0;
				} else {
					/* consume on a run event, release on an end event */
					for (auto cur_res = nres; cur_res != NULL; cur_res = cur_res->next) {
						if (cur_res->type.is_consumable) {
							auto req = find_resource_req(ns->resreq, cur_res->def);
							if (req != NULL) {
								cur_res->assigned += is_run_event ? req->amount : -req->amount;
							}
						}
					}
					/* availability can only drop after resources were consumed */
					if (is_run_event) {
						long long chunks = check_avail_resources(nres, resreq,
											 CHECK_ALL_BOOLS | UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, err);
						if (chunks < min_chunks)
							min_chunks = chunks;
					}
				}
			}
		}
		free_resource_list(nres);

		/* keep a provisioning conflict if one was reported, otherwise blame
		 * the calendar
		 */
		if (min_chunks == 0) {
			if (err->error_code != PROV_RESRESV_CONFLICT)
				set_schd_error_codes(err, NOT_RUN, RESERVATION_CONFLICT);
		}
	}

	return min_chunks;
}

/**
 * @brief compare two place specs to see if they are equal
 *
 * Two NULL specs are equal; a NULL spec never equals a non-NULL one.
 * Otherwise all placement flags and the group resource name must match.
 *
 * @param[in] pl1 - place spec 1
 * @param[in] pl2 - place spec 2
 * @return  1 if equal 0 if not
 */
int
compare_place(place *pl1, place *pl2)
{
	if (pl1 == NULL || pl2 == NULL)
		return (pl1 == NULL && pl2 == NULL) ? 1 : 0;

	const bool same_flags = pl1->excl == pl2->excl &&
				pl1->exclhost == pl2->exclhost &&
				pl1->share == pl2->share &&
				pl1->free == pl2->free &&
				pl1->pack == pl2->pack &&
				pl1->scatter == pl2->scatter &&
				pl1->vscatter == pl2->vscatter;
	if (!same_flags)
		return 0;

	/* group: both unset is a match, only one set is not */
	if (pl1->group == NULL || pl2->group == NULL)
		return (pl1->group == NULL && pl2->group == NULL) ? 1 : 0;

	return strcmp(pl1->group, pl2->group) == 0 ? 1 : 0;
}

/**
 * @brief
 *		parse_placespec - allocate a new place structure and parse
 *		a placement spec (-l place)
 *
 *		The spec is a ':' separated list of tokens.  If a "group=res"
 *		token is given more than once, the last one wins.  When none of
 *		pack, scatter, vscatter or free is given, free is assumed.
 *
 * @param[in]	place_str	-	placespec as a string
 *
 * @return	newly allocated place (release it with free_place())
 * @retval	NULL	: invalid placement spec, place_str is NULL, or memory
 *			  could not be allocated
 *
 */
place *
parse_placespec(char *place_str)
{
	/* working copy of the place spec - max log size should be big enough */
	char str[MAX_LOG_SIZE];
	char *tokptr;
	int invalid = 0;

	if (place_str == NULL)
		return NULL;

	place *pl = new_place();
	if (pl == NULL)
		return NULL;

	pbs_strncpy(str, place_str, sizeof(str));

	char *tok = string_token(str, ":", &tokptr);

	while (tok != NULL && !invalid) {
		if (!strcmp(tok, PLACE_Pack))
			pl->pack = 1;
		else if (!strcmp(tok, PLACE_Scatter))
			pl->scatter = 1;
		else if (!strcmp(tok, PLACE_Excl))
			pl->excl = 1;
		else if (!strcmp(tok, PLACE_Free))
			pl->free = 1;
		else if (!strcmp(tok, PLACE_Shared))
			pl->share = 1;
		else if (!strcmp(tok, PLACE_VScatter))
			pl->vscatter = 1;
		else if (!strcmp(tok, PLACE_ExclHost)) {
			/* exclhost implies excl */
			pl->exclhost = 1;
			pl->excl = 1;
		} else if (!strncmp(tok, PLACE_Group, 5)) {
			/* format: group=res */
			if (tok[5] == '=') {
				/* a repeated group= replaces the earlier value; release the
				 * previous copy so it is not leaked
				 */
				free(pl->group);
				/* "group=" is 6 characters so tok[6] should be the first character of
				 * the resource
				 */
				pl->group = string_dup(&tok[6]);
				if (pl->group == NULL)
					invalid = 1; /* do not hand back a place that silently lost its group */
			} else
				invalid = 1;
		} else
			invalid = 1;

		tok = string_token(NULL, ":", &tokptr);
	}

	/* pack and scatter vscatter, and free are all mutually exclusive */
	if (pl->pack + pl->scatter + pl->free + pl->vscatter > 1)
		invalid = 1;

	/* if no scatter, vscatter, pack, or free given, default to free */
	if (pl->pack + pl->scatter + pl->free + pl->vscatter == 0)
		pl->free = 1;

	if (invalid) {
		free_place(pl);
		return NULL;
	}

	return pl;
}

/**
 * @brief
 * 		parse a select spec into a selspec structure with
 *		a dependent array of chunks.  Non-consumable resources
 *		are sorted first in the chunk resource list
 *
 * @param[in]	sspec	-	the select spec to parse
 *
 * @return	selspec*
 * @retval	pointer to a selspec obtained by parsing the select spec
 *			of the job/resv.
 * @retval	NULL	: on error or invalid spec
 *
 * @par MT-safe: Yes
 */
selspec *
parse_selspec(const std::string &sspec)
{
	resource_req *req_head = NULL;
	resource_req *req_end = NULL;
	int invalid = 0;

	int num_kv;
	struct key_value_pair *kv = NULL;
	int nkvelements = 0;

	int num_chunks;
	int num_cpus = 0;

	int n = 0;

	const char *select_spec = sspec.c_str();

	/* a plain new expression throws on failure, so no NULL check is needed */
	selspec *spec = new selspec();

	int num_plus = 0;
	for (const char *p = select_spec; *p != '\0'; p++) {
		if (*p == '+')
			num_plus++;
	}

	/* num_plus + 2: 1 for the initial chunk 1 for the NULL ptr */
	if ((spec->chunks = static_cast<chunk **>(calloc(num_plus + 2, sizeof(chunk *)))) == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		delete spec;
		return NULL;
	}

	/* select specs can be large, so the tokenizer works on a heap copy of
	 * the spec which is released before returning
	 */
	char *specbuf = string_dup(select_spec);
	if (specbuf == NULL) {
		/* log before the delete so errno still belongs to the failed allocation */
		log_err(errno, __func__, MEM_ERR_MSG);
		delete spec;
		return NULL;
	}

	char *endp = NULL;
	char *tok = string_token(specbuf, "+", &endp);

	/* copy of the chunk string currently being parsed; ownership moves to
	 * the chunk once it has been created
	 */
	char *tmpptr = NULL;
	while (tok != NULL && !invalid) {
		tmpptr = string_dup(tok);
		auto ret = parse_chunk_r(tok, &num_chunks, &num_kv, &nkvelements, &kv, NULL);

		if (!ret) {
			for (int i = 0; i < num_kv && !invalid; i++) {
				resource_req *req = create_resource_req(kv[i].kv_keyw, kv[i].kv_val);

				if (req == NULL)
					invalid = 1;
				else {
					if (strcmp(req->name, "ncpus") == 0) {
						/* Given: -l select=nchunk1:ncpus=Y + nchunk2:ncpus=Z +... */
						/* Then: # of cpus = (nchunk1 * Y) + (nchunk2 * Z) + ... */
						num_cpus += (num_chunks * req->amount);
					}
					const auto &rtc = conf.res_to_check;
					/* keep booleans and resources which are being checked
					 * (an empty res_to_check keeps everything)
					 */
					if (req->type.is_boolean || rtc.empty() || rtc.find(kv[i].kv_keyw) != rtc.end()) {
						spec->defs.insert(req->def);
						if (req_head == NULL)
							req_end = req_head = req;
						else {
							/* consumables are appended, everything else is
							 * prepended so non-consumables come first
							 */
							if (req->type.is_consumable) {
								req_end->next = req;
								req_end = req;
							} else {
								req->next = req_head;
								req_head = req;
							}
						}
					} else
						free_resource_req(req);
				}
			}
			spec->chunks[n] = new_chunk();
			if (spec->chunks[n] != NULL) {
				spec->chunks[n]->num_chunks = num_chunks;
				spec->chunks[n]->seq_num = get_sched_rank();
				spec->total_chunks += num_chunks;
				spec->total_cpus = num_cpus;
				spec->chunks[n]->req = req_head;
				spec->chunks[n]->str_chunk = tmpptr;
				tmpptr = NULL;
				req_head = NULL;
				req_end = NULL;
				n++;
			} else {
				/* no chunk took ownership of the requests built above:
				 * release them here so they are not leaked
				 */
				while (req_head != NULL) {
					resource_req *next_req = req_head->next;
					free_resource_req(req_head);
					req_head = next_req;
				}
				req_end = NULL;
				invalid = 1;
			}
		} else
			invalid = 1;

		tok = string_token(NULL, "+", &endp);
	}
	free(kv);
	free(specbuf);

	if (invalid) {
		delete spec;
		/* only non-NULL when the last chunk string was never handed to a chunk */
		free(tmpptr);
		return NULL;
	}

	return spec;
}

/**
 *	@brief compare two chunks for equality
 *
 *	Chunks are equal when both are NULL, or when both have the same
 *	num_chunks and compare_resource_req_list() reports their request
 *	lists as equal over conf.resdef_to_check.
 *
 *	@param[in] c1 - first chunk
 * 	@param[in] c2 - second chunk
 *
 *	@return int
 *	@retval 1 if chunks are equal
 *	@retval 0 if chunks are not equal
 */
int
compare_chunk(chunk *c1, chunk *c2)
{
	if (c1 == NULL || c2 == NULL)
		return (c1 == NULL && c2 == NULL) ? 1 : 0;

	/* the request lists are only compared when the counts agree */
	const bool same = c1->num_chunks == c2->num_chunks &&
			  compare_resource_req_list(c1->req, c2->req, conf.resdef_to_check) != 0;

	return same ? 1 : 0;
}

/**
 *	@brief compare two selspecs for equality
 *
 *	Two NULL selspecs are equal.  Otherwise both must have the same
 *	total_chunks and their NULL terminated chunk arrays must have the
 *	same length with pairwise equal chunks (see compare_chunk()).
 *	A selspec without a chunks array is never equal to anything.
 *
 *	@param[in] s1 - first selspec
 *	@param[in] s2 - second selspec
 *
 *	@returns int
 *	@retval 1 if selspecs are equal
 *	@retval 0 if not equal
 */
int
compare_selspec(selspec *s1, selspec *s2)
{
	if (s1 == NULL && s2 == NULL)
		return 1;
	if (s1 == NULL || s2 == NULL)
		return 0;

	if (s1->total_chunks != s2->total_chunks)
		return 0;

	if (s1->chunks == NULL || s2->chunks == NULL)
		return 0;

	int i;
	for (i = 0; s1->chunks[i] != NULL; i++) {
		/* compare_chunk() rejects a NULL s2 entry, so s2 is never read
		 * past its terminator
		 */
		if (compare_chunk(s1->chunks[i], s2->chunks[i]) == 0)
			return 0;
	}

	/* s1 is exhausted; s2 must end at the same index, otherwise it has
	 * chunks which were never compared
	 */
	return s2->chunks[i] == NULL ? 1 : 0;
}

/**
 * @brief
 * 		create an execvnode from a node solution array
 *
 * @param[in]	ns_arr	-	the nspecs with the chosen nodes to run the job on
 *
 * @par MT-safe:	no
 *
 * @return	execvnode in static memory; the string is overwritten by the
 *		next call and must not be freed by the caller
 * @retval	NULL	: memory could not be allocated or a resource value
 *			  could not be formatted
 *
 */
char *
create_execvnode(std::vector<nspec *> &ns_arr)
{
	static char *execvnode = NULL;
	static int execvnode_size = 0;
	static char *buf = NULL;
	static int bufsize = 0;
	char buf2[128];
	bool end_of_chunk = true;

	/* the two work buffers are allocated once and reused by later calls */
	if (execvnode == NULL) {
		execvnode = static_cast<char *>(malloc(INIT_ARR_SIZE + 1));

		if (execvnode == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			return NULL;
		}
		execvnode_size = INIT_ARR_SIZE;
	}
	if (buf == NULL) {
		buf = static_cast<char *>(malloc(INIT_ARR_SIZE + 1));
		if (buf == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			return NULL;
		}
		bufsize = INIT_ARR_SIZE;
	}
	execvnode[0] = '\0';

	bool need_plus = false;
	for (const auto &ns : ns_arr) {
		/* buf holds the text for this nspec; all but the first start with '+' */
		if (need_plus)
			strcpy(buf, "+");
		else {
			need_plus = true;
			buf[0] = '\0';
		}

		/* the previous nspec closed its chunk, so this one opens a new one */
		if (end_of_chunk) {
			if (pbs_strcat(&buf, &bufsize, "(") == NULL)
				return NULL;
		}

		if (pbs_strcat(&buf, &bufsize, ns->ninfo->name.c_str()) == NULL)
			return NULL;

		end_of_chunk = ns->end_of_chunk;

		for (resource_req *req = ns->resreq; req != NULL; req = req->next) {
			if (req->type.is_consumable) {
				if (pbs_strcat(&buf, &bufsize, ":") == NULL)
					return NULL;
				if (pbs_strcat(&buf, &bufsize, req->name) == NULL)
					return NULL;

				/* bounded formatting: a very large amount must not be
				 * able to write past the end of buf2
				 */
				int len;
				if (req->type.is_float)
					len = snprintf(buf2, sizeof(buf2), "=%.*f",
						       float_digits(req->amount, FLOAT_NUM_DIGITS), req->amount);
				else
					len = snprintf(buf2, sizeof(buf2), "=%.0lf%s", ceil(req->amount),
						       req->type.is_size ? "kb" : "");
				if (len < 0 || static_cast<size_t>(len) >= sizeof(buf2)) {
					log_err(-1, __func__, "Resource value is too long to format for execvnode");
					return NULL;
				}

				if (pbs_strcat(&buf, &bufsize, buf2) == NULL)
					return NULL;
			} else if (ns->go_provision && strcmp(req->name, "aoe") == 0) {
				/* the aoe is only emitted for nodes which will be provisioned */
				if (pbs_strcat(&buf, &bufsize, ":aoe=") == NULL)
					return NULL;
				if (pbs_strcat(&buf, &bufsize, req->res_str) == NULL)
					return NULL;
			}
		}
		if (end_of_chunk)
			if (pbs_strcat(&buf, &bufsize, ")") == NULL)
				return NULL;

		if (pbs_strcat(&execvnode, &execvnode_size, buf) == NULL)
			return NULL;
	}

	return execvnode;
}

/**
 * @brief
 *		parse_execvnode - parse an execvnode into an nspec array
 *
 * @param[in]	execvnode	-	the execvnode to parse
 * @param[in]	sinfo		-	server to get the nodes from
 * @param[in]	sel			- select to map
 *
 * @return	a newly allocated nspec array for the execvnode
 *
 */
std::vector<nspec *>
parse_execvnode(char *execvnode, server_info *sinfo, selspec *sel)
{
	char *simplespec;
	char *excvndup;
	char *node_name;
	int num_el;
	struct key_value_pair *kv = NULL;

	std::vector<nspec *> nspec_arr;
	node_info *ninfo;
	resource_req *req;
	int i, j;

	bool invalid = false;

	int num_chunk;
	int nlkv = 0;
	char *p;
	char *tailptr = NULL;
	int hp;
	int cur_chunk_num = 0;
	int cur_tot_chunks = 0;
	int chunks_ind;
	int num_paren = 0;
	int in_superchunk = 0;

	if (execvnode == NULL || sinfo == NULL)
		return {};

	p = execvnode;

	/* number of chunks is number of pluses + 1 */
	num_chunk = 1;

	while (p != NULL && *p != '\0') {
		if (*p == '+')
			num_chunk++;
		if (*p == '(')
			num_paren++;

		p++;
	}

	/* Number of chunks in exec_vnode don't match selspec, don't map chunks */
	if (sel != NULL && num_paren != sel->total_chunks)
		sel = NULL;

	if ((excvndup = string_dup(execvnode)) == NULL)
		return {};

	simplespec = parse_plus_spec_r(excvndup, &tailptr, &hp);
	if (hp > 0) /* simplespec starts with '(' but doesn't close */
		in_superchunk = 1;

	if (simplespec == NULL)
		invalid = true;
	else if (parse_node_resc_r(simplespec, &node_name, &num_el, &nlkv, &kv) != 0)
		invalid = true;

	if (sel != NULL) {
		cur_tot_chunks = sel->chunks[0]->num_chunks;
		chunks_ind = 0;
	}
	for (i = 0; i < num_chunk && !invalid && simplespec != NULL; i++) {
		auto ns = new nspec();
		nspec_arr.push_back(ns);
		ninfo = find_node_info(sinfo->nodes, node_name);
		if (ninfo != NULL) {
			ns->ninfo = ninfo;
			for (j = 0; j < num_el; j++) {
				req = create_resource_req(kv[j].kv_keyw, kv[j].kv_val);
				if (req != NULL) {
					if (ns->resreq == NULL)
						ns->resreq = req;
					else {
						req->next = ns->resreq;
						ns->resreq = req;
					}
				} else
					invalid = true;
			}
		} else {
			log_event(PBSEVENT_DEBUG, PBS_EVENTCLASS_JOB, LOG_DEBUG, node_name,
				  "Exechost contains a node that does not exist.");
			invalid = true;
		}
		if (sel != NULL) {
			/* This shouldn't happen since we checked above to make sure we could map properly */
			if (sel->chunks[chunks_ind] == NULL) {
				log_event(PBS_EVENTCLASS_NODE, PBS_EVENTCLASS_NODE, LOG_WARNING, __func__, "Select spec and exec_vnode/resv_nodes can not be mapped");
				free_nspecs(nspec_arr);
				return {};
			}
			ns->chk = sel->chunks[chunks_ind];
			ns->seq_num = ns->chk->seq_num;
		}
		if (!in_superchunk || hp < 0) {
			ns->end_of_chunk = 1;
			if (sel != NULL) {
				cur_chunk_num++;
				if (cur_chunk_num == cur_tot_chunks) {
					chunks_ind++;
					if (sel->chunks[chunks_ind] != NULL) {
						cur_tot_chunks = sel->chunks[chunks_ind]->num_chunks;
						cur_chunk_num = 0;
					}
				}
			}
		}

		if (!invalid) {
			simplespec = parse_plus_spec_r(tailptr, &tailptr, &hp);
			if (simplespec != NULL) {
				int ret;

				if (hp > 0) /* simplespec starts with '(' but doesn't end with ')' */
					in_superchunk = 1;
				else if (hp < 0) /* simplespec ends with ')' but does not start with '(' */
					in_superchunk = 0;
				/* hp == 0 simplespec either starts and ends with '(' ')' or has neither */

				ret = parse_node_resc_r(simplespec, &node_name, &num_el, &nlkv, &kv);
				if (ret < 0)
					invalid = true;
			}
		}
	}

	free(kv);
	free(excvndup);

	if (invalid) {
		log_eventf(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_WARNING, __func__,
			   "Failed to parse execvnode: %s", execvnode);
		free_nspecs(nspec_arr);
		return {};
	}

	return nspec_arr;
}

/**
 * @brief
 *		node_state_to_str - convert a node's state into a string for printing
 *
 *		When several state flags are set, the first match in the order
 *		of the table below is reported.
 *
 * @param[in]	ninfo	-	the node
 *
 * @return	static string of node state
 * @retval	""	: ninfo is NULL
 * @retval	ND_state_unknown	: none of the known state flags is set
 *
 */
const char *
node_state_to_str(node_info *ninfo)
{
	if (ninfo == NULL)
		return "";

	/* ordered by priority: the first flag which is set wins */
	const struct {
		bool is_set;
		const char *label;
	} states[] = {
		{static_cast<bool>(ninfo->is_job_busy), ND_jobbusy},
		{static_cast<bool>(ninfo->is_free), ND_free},
		{static_cast<bool>(ninfo->is_down), ND_down},
		{static_cast<bool>(ninfo->is_offline), ND_offline},
		{static_cast<bool>(ninfo->is_resv_exclusive), ND_resv_exclusive},
		{static_cast<bool>(ninfo->is_job_exclusive), ND_job_exclusive},
		{static_cast<bool>(ninfo->is_busy), ND_busy},
		{static_cast<bool>(ninfo->is_stale), ND_Stale},
		{static_cast<bool>(ninfo->is_provisioning), ND_prov},
		{static_cast<bool>(ninfo->is_sleeping), ND_sleep},
		{static_cast<bool>(ninfo->is_maintenance), ND_maintenance},
	};

	for (const auto &state : states) {
		if (state.is_set)
			return state.label;
	}

	/* default */
	return ND_state_unknown;
}

/**
 * @brief
 *		combine_nspec_array - find and combine any nspec's for the same node
 *		in an nspec array.  Because nspecs no longer map to the original chunks
 *		they came from, seq_num and chk no longer have meaning.  They are left
 *		at the values a freshly constructed nspec has.
 *
 * @param[in]	nspec_arr	-	array to combine (not modified)
 *
 * @return	vector<nspec *>
 * @retval	combined nspec array, one nspec per node rank, in order of the
 *		first appearance of each node (up to caller to free)
 * @retval	empty vector	: nspec_arr is empty, or a resource request
 *		could not be duplicated
 *
 */
std::vector<nspec *>
combine_nspec_array(const std::vector<nspec *> &nspec_arr)
{
	std::vector<nspec *> new_nspec_arr;
	/* node rank -> combined nspec already created for that node */
	std::unordered_map<int, nspec *> nspec_umap;

	if (nspec_arr.empty())
		return {};

	for (const auto &ns : nspec_arr) {
		auto numap = nspec_umap.find(ns->ninfo->rank);
		if (numap == nspec_umap.end()) {
			/* first nspec for this node: start a combined nspec from a copy */
			auto new_ns = new nspec();

			nspec_umap[ns->ninfo->rank] = new_ns;

			new_ns->end_of_chunk = true;
			new_ns->ninfo = ns->ninfo;
			new_ns->resreq = dup_resource_req_list(ns->resreq);
			new_nspec_arr.push_back(new_ns);
		} else {
			/* node seen before: fold this nspec's requests into the combined one */
			auto new_ns = numap->second;
			for (auto req_j = ns->resreq; req_j != NULL; req_j = req_j->next) {
				auto req_i = find_resource_req(new_ns->resreq, req_j->def);
				if (req_i != NULL) {
					/* we assume that if the resource is a boolean or a string
					 * the value is either the same, or doesn't exist
					 * so we don't need to do validity checking
					 */
					if (req_j->type.is_consumable)
						req_i->amount += req_j->amount;
					else if (req_j->type.is_string && req_i->res_str == NULL)
						req_i->res_str = string_dup(req_j->res_str);
				} else { /* This is the first time we've seen this resource */
					auto tmpreq = dup_resource_req(req_j);
					if (tmpreq == NULL) {
						/* don't dereference a failed duplication; give up
						 * and release what has been built so far
						 */
						free_nspecs(new_nspec_arr);
						return {};
					}
					/* prepend to the combined request list */
					tmpreq->next = new_ns->resreq;
					new_ns->resreq = tmpreq;
				}
			}
		}
	}
	return new_nspec_arr;
}

/**
 * @brief
 *		build a NULL terminated node_info array holding each node referenced
 *		by an nspec array once (nodes are considered the same if their
 *		names are equal)
 *
 * @param[in]	nspec_arr	-	source nspec array
 *
 * @note
 *		the nodes are emitted in the iteration order of an unordered_map,
 *		not in the order they appear in nspec_arr.  Only the array is
 *		allocated here; the node_info pointers are shared with nspec_arr.
 *
 * @return	new node_info array
 * @retval	NULL	: nspec_arr is empty or memory could not be allocated
 *
 */
node_info **
create_node_array_from_nspec(std::vector<nspec *> &nspec_arr)
{
	std::unordered_map<std::string, node_info *> uniq_nodes;

	if (nspec_arr.empty())
		return NULL;

	/* sized for the worst case (every nspec on a different node) + terminator */
	auto out_arr = static_cast<node_info **>(calloc(nspec_arr.size() + 1, sizeof(node_info *)));
	if (out_arr == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return NULL;
	}

	/* emplace() leaves an existing entry untouched, so the first nspec
	 * seen for a name decides which node_info is stored
	 */
	for (const auto &ns : nspec_arr)
		uniq_nodes.emplace(ns->ninfo->name, ns->ninfo);

	int filled = 0;
	for (const auto &entry : uniq_nodes)
		out_arr[filled++] = entry.second;

	return out_arr;
}
/**
 * @brief
 *	reorder the nodes for the avoid_provision or smp_cluster_dist policies
 *	(the original comment also lists "when the reservation is being
 *	altered" as a use) without changing the source array.  We do so by
 *	holding our own static array of node pointers that we fill and sort
 *	for the different policies.
 *
 * @param[in]	nodes	: nodes to reorder
 * @param[in]	resresv : job or reservation for which reorder is done
 *
 * @see	last_node_name - the last allocated node - used for round_robin
 *
 * @return	node_info **
 * @retval	reordered list of nodes if needed (the static array)
 * @retval	'nodes' parameter if nodes do not need reordering
 *		(SMP_NODE_PACK or an unrecognized smp_dist value)
 * @retval	NULL	: nodes is NULL, resresv is NULL while the provision
 *			  policy is AVOID_PROVISION, or memory allocation failed
 *
 * @par Side Effects:
 *      static variable node_array holds onto memory in the heap for reuse.
 *      The caller should not free the return.
 *      last_node_name is seeded with the first node's name if it is empty.
 *      cmp_aoename is freed and replaced when the nodes are sorted on aoe.
 *
 * @par MT-safe:	No
 */
node_info **
reorder_nodes(node_info **nodes, resource_resv *resresv)
{
	static node_info **node_array = NULL;
	static int node_array_size = 0;
	node_info **nptr = NULL;
	node_info **tmparr = NULL;
	schd_resource *hostres = NULL;
	schd_resource *cur_hostres = NULL;
	int nsize = 0;
	int i = 0;
	int j = 0;
	int k = 0;

	if (nodes == NULL)
		return NULL;

	if (resresv == NULL && conf.provision_policy == AVOID_PROVISION)
		return NULL;

	nsize = count_array(nodes);

	/* grow the reusable static array so it can hold every node plus the NULL terminator */
	if ((node_array_size < nsize + 1) || node_array == NULL) {
		tmparr = static_cast<node_info **>(realloc(node_array, sizeof(node_info *) * (nsize + 1)));
		if (tmparr == NULL) {
			log_err(errno, __func__, MEM_ERR_MSG);
			return NULL;
		}

		node_array = tmparr;
		node_array_size = nsize + 1;
	}
	tmparr = NULL;

	node_array[0] = NULL;
	nptr = node_array;

	/* no node recorded yet: start from the first node in the list */
	if (last_node_name[0] == '\0' && nodes[0] != NULL)
		pbs_strncpy(last_node_name, nodes[0]->name.c_str(), sizeof(last_node_name));

	if (resresv != NULL) {
		if (resresv->aoename != NULL && conf.provision_policy == AVOID_PROVISION) {
			/* copy the nodes (terminator included) and sort the copy with cmp_aoe */
			memcpy(nptr, nodes, (nsize + 1) * sizeof(node_info *));

			if (cmp_aoename != NULL)
				free(cmp_aoename);

			/* presumably cmp_aoe reads cmp_aoename to know the requested aoe - confirm */
			cmp_aoename = string_dup(resresv->aoename);
			qsort(nptr, nsize, sizeof(node_info *), cmp_aoe);

			log_eventf(PBSEVENT_DEBUG3, PBS_EVENTCLASS_JOB, LOG_DEBUG, resresv->name,
				   "Re-sorted the nodes on aoe %s, since aoe was requested", resresv->aoename);

			return nptr;
		}
	}

	switch (cstat.smp_dist) {
		case SMP_NODE_PACK:
			/* no reordering: hand back the caller's own array */
			nptr = nodes;
			break;

		case SMP_ROUND_ROBIN:

			/* scratch copy of the nodes, sorted with cmp_node_host */
			if ((tmparr = static_cast<node_info **>(calloc(node_array_size, sizeof(node_info *)))) == NULL) {
				log_err(errno, __func__, MEM_ERR_MSG);
				return NULL;
			}

			memcpy(tmparr, nodes, nsize * sizeof(node_info *));
			qsort(tmparr, nsize, sizeof(node_info *), cmp_node_host);

			/* locate the node named by last_node_name; i == nsize if it is not present */
			for (i = 0; i < nsize && tmparr[i]->name != last_node_name; i++)
				;

			if (i < nsize) {
				/* find the vnode of the next host or the end of the list since the
				 * beginning will definitely be a different host because of our sort
				 */
				hostres = find_resource(tmparr[i]->res, allres["host"]);
				if (hostres != NULL) {
					for (; i < nsize; i++) {
						cur_hostres = find_resource(tmparr[i]->res, allres["host"]);
						if (cur_hostres != NULL) {
							if (!compare_res_to_str(cur_hostres, hostres->str_avail[0], CMP_CASELESS))
								break;
						}
					}
				}
			}

			/* rotate the sorted list so that it starts at index i */

			/* copy from our last location to the end */
			for (j = 0, k = i; k < nsize; j++, k++)
				nptr[j] = tmparr[k];

			/* copy from the beginning to our last location */
			for (k = 0; k < i; j++, k++)
				nptr[j] = tmparr[k];

			nptr[j] = NULL;

			free(tmparr);
			break;

		default:
			/* unknown policy: log it and fall back to the caller's array */
			nptr = nodes;
			log_event(PBSEVENT_SCHED, PBS_EVENTCLASS_FILE, LOG_NOTICE, "", "Invalid smp_cluster_dist value");
	}

	return nptr;
}

/**
 * @brief
 *		ok_break_chunk - is it OK to break up a chunk on a list of nodes?
 *		It is OK when every node that has a host resource fully matches
 *		the host value of the first such node in the list.
 *
 * @param[in]	resresv	-	the requestor (only checked for NULL)
 * @param[in]	nodes   -	the NULL terminated list of nodes to check
 *
 * @note
 *		a node without a host resource is logged and otherwise ignored
 *
 * @return	int
 * @retval	1	: if its OK to break up chunks across the nodes
 * @retval	0	: if it is not, or if resresv or nodes is NULL
 *
 */
int
ok_break_chunk(resource_resv *resresv, node_info **nodes)
{
	if (resresv == NULL || nodes == NULL)
		return 0;

	schd_resource *first_host = NULL;

	for (int n = 0; nodes[n] != NULL; n++) {
		schd_resource *cur_host = find_resource(nodes[n]->res, allres["host"]);

		if (cur_host == NULL) {
			log_event(PBSEVENT_SCHED, PBS_EVENTCLASS_NODE, LOG_WARNING,
				  nodes[n]->name, "Node has no host resource");
			continue;
		}

		/* the first host resource found becomes the reference value */
		if (first_host == NULL) {
			first_host = cur_host;
			continue;
		}

		/* any host that differs from the reference ends the search */
		if (match_string_array(first_host->str_avail, cur_host->str_avail) != SA_FULL_MATCH)
			return 0;
	}

	return 1;
}

/**
 * @brief
 *		is_excl - decide whether a request/node combination is exclusive.
 *		The node's forced sharing values are honored first, then the
 *		request's place directive, then the node's default sharing values.
 *
 * @param[in]	pl	-	place directive of the request (may be NULL)
 * @param[in]	sharing	-	sharing attribute of the node
 *
 * @return	int
 * @retval	1	: if exclusive
 * @retval	0	: if not
 *
 * @note
 *		A NULL pl is treated as a request which asked for neither excl
 *		nor shared.
 */
int
is_excl(place *pl, enum vnode_sharing sharing)
{
	/* the node's forced settings can not be overridden by the request */
	switch (sharing) {
		case VNS_FORCE_EXCL:
		case VNS_FORCE_EXCLHOST:
			return 1;

		case VNS_IGNORE_EXCL:
			return 0;

		default:
			break;
	}

	/* next the request gets its say */
	if (pl != NULL) {
		if (pl->excl)
			return 1;

		if (pl->share)
			return 0;
	}

	/* finally fall back to the node's default; anything else is shared */
	if (sharing == VNS_DFLT_EXCL || sharing == VNS_DFLT_EXCLHOST)
		return 1;

	return 0;
}

/**
 * @brief
 * 		take a node solution and extend it by allocating the rest of
 *		a node array to it.
 *
 * @param[in,out]	nsa	-	currently allocated node solution to be
 *					extended with ninfo_arr
 * @param[in] ninfo_arr - NULL terminated node array to allocate to nspec array
 *
 * @note
 *		Every node of ninfo_arr which find_nspec() does not find in nsa gets
 *		a new nspec appended.  The new nspecs are marked end_of_chunk, share
 *		the highest seq_num already in nsa (0 if none is higher) and take
 *		their sub_seq_num from get_sched_rank().
 *
 * @return	int
 * @retval	1	: on success
 * @retval	0	: ninfo_arr is NULL (nsa is left untouched)
 *
 */
int
alloc_rest_nodepart(std::vector<nspec *> &nsa, node_info **ninfo_arr)
{
	if (ninfo_arr == NULL)
		return 0;

	/* the added nspecs reuse the highest sequence number of the solution */
	int top_seq_num = 0;
	for (const auto &cur : nsa) {
		if (cur->seq_num > top_seq_num)
			top_seq_num = cur->seq_num;
	}

	for (node_info **nodep = ninfo_arr; *nodep != NULL; nodep++) {
		/* node is already part of the solution */
		if (find_nspec(nsa, *nodep) != NULL)
			continue;

		nspec *added = new nspec();
		added->ninfo = *nodep;
		added->end_of_chunk = 1;
		added->seq_num = top_seq_num;
		added->sub_seq_num = get_sched_rank();
		nsa.push_back(added);
	}

	return 1;
}

/**
 * @brief
 * 		determine if a chunk can fit on one vnode in node list
 *
 * @param[in]	req	-	requested resources to compare to nodes
 * @param[in]	ninfo_arr	-	NULL terminated node array
 *
 * @par NOTE:
 * 		all resources in req will be honored regardless of
 * 	    whether they are in conf.res_to_check or not due to the fact
 *		that chunk resources only contain such resources
 *
 * @par Side Effects:
 *		a schd_error object is allocated on first use and kept in a
 *		static variable for later calls.
 *
 * @return	int
 * @retval	1	: chunk can fit in 1 vnode
 * @retval	0	: chunk can not fit / error
 *
 */
int
can_fit_on_vnode(resource_req *req, node_info **ninfo_arr)
{
	/* scratch error object; its contents are never reported to the caller */
	static schd_error *dumperr = NULL;

	if (req == NULL || ninfo_arr == NULL)
		return 0;

	if (dumperr == NULL) {
		dumperr = new_schd_error();
		/* nothing can be recorded in an error object which doesn't exist,
		 * so just report the failure through the return value
		 */
		if (dumperr == NULL)
			return 0;
	}

	for (int i = 0; ninfo_arr[i] != NULL; i++) {
		clear_schd_error(dumperr);

		/* the vnode must be eligible for the chunk and have the resources available */
		if (is_vnode_eligible_chunk(req, ninfo_arr[i], NULL, dumperr)) {
			if (check_avail_resources(ninfo_arr[i]->res, req,
						  UNSET_RES_ZERO, INSUFFICIENT_RESOURCE, NULL))
				return 1;
		}
	}

	return 0;
}

/**
 * @brief
 *	Checks if an EOE is available on a vnode
 *
 * @par Functionality:
 *	Looks up the "eoe" resource of the vnode and reports whether the
 *	eoename requested by the job or reservation is one of its available
 *	values.
 *
 * @param[in]	ninfo		-	pointer to node_info
 * @param[in]	resresv		-	pointer to resource_resv
 *
 * @return	int
 * @retval	 0 : EOE not available (also for NULL arguments, a request
 *		     without an eoename, or a vnode without an eoe resource)
 * @retval	 otherwise the result of is_string_in_arr() for the eoename
 *
 * @par MT-safe: No
 *
 */
int
is_eoe_avail_on_vnode(node_info *ninfo, resource_resv *resresv)
{
	if (ninfo == NULL || resresv == NULL || resresv->eoename == NULL)
		return 0;

	schd_resource *eoe_res = find_resource(ninfo->res, allres["eoe"]);
	if (eoe_res == NULL)
		return 0;

	return is_string_in_arr(eoe_res->str_avail, resresv->eoename);
}

/**
 * @brief
 *		Checks if a vnode is eligible to be provisioned
 *
 * @par Functionality:
 *		Nothing is checked when provisioning is not needed for resresv or
 *		when resresv is a job without an aoe.
 *		Provisioning is considered needed when a job requests an aoe
 *		different from the one instantiated on the vnode, or when a
 *		reservation requests an aoe.  In that case the vnode is
 *		provisionable only if all of the following hold:
 *			(1) Vnode is not multi-vnoded,
 *			(2) Server has provisioning enabled,
 *			(3) Vnode has provisioning enabled,
 *			(4) Vnode does not have suspended jobs,
 *			(5) Vnode does not have any running jobs (inside / outside resvs)
 *		Independently of the above, the vnode is refused when:
 *			(6) resresv is a job and a reservation without an aoe is
 *			    running on the vnode,
 *			(7) resresv is a reservation without an aoe and a job with
 *			    an aoe is on the vnode
 *
 * @see
 *		should_backfill_with_job
 *
 * @param[in]	node		-	pointer to node_info
 * @param[in]	resresv		-	pointer to resource_resv
 * @param[out]	err		-	pointer to schd_error, set when
 *					NOT_PROVISIONABLE is returned
 *
 * @return	int
 * @retval	NO_PROVISIONING_NEEDED	: resresv doesn't request aoe
 *			or node doesn't need provisioning
 * @retval	PROVISIONING_NEEDED : vnode is provisionable and needs
 *			provisioning
 * @retval	NOT_PROVISIONABLE  : vnode is not provisionable
 *			(see err for more details)
 *
 * @par MT-safe:	No
 *
 */
int
is_provisionable(node_info *node, resource_resv *resresv, schd_error *err)
{
	int result = NO_PROVISIONING_NEEDED;

	if (!resresv->is_prov_needed ||
	    (resresv->is_job && resresv->aoename == NULL))
		return NO_PROVISIONING_NEEDED;

	/* a job reaching this point always has an aoename (checked above) */
	const bool job_aoe_differs = resresv->is_job &&
				     (node->current_aoe == NULL || strcmp(resresv->aoename, node->current_aoe) != 0);
	const bool resv_wants_aoe = resresv->is_resv && resresv->aoename != NULL;

	/* Perform checks if job is going to provision now or if reservation has aoe. */
	if (job_aoe_differs || resv_wants_aoe) {
		/* the node requires provisioning, find out if that is allowed */
		result = PROVISIONING_NEEDED;

		if (node->is_multivnoded) {
			set_schd_error_codes(err, NOT_RUN, IS_MULTI_VNODE);
			return NOT_PROVISIONABLE;
		}

		/* PROV_DISABLE_ON_SERVER is NOT_RUN instead of NEVER RUN.
		 * Even though we can't provision any nodes, there might be
		 * enough nodes in the correct aoe to run the job.
		 */
		if (!resresv->server->provision_enable) {
			set_schd_error_codes(err, NOT_RUN, PROV_DISABLE_ON_SERVER);
			return NOT_PROVISIONABLE;
		}

		if (!node->provision_enable) {
			set_schd_error_codes(err, NOT_RUN, PROV_DISABLE_ON_NODE);
			return NOT_PROVISIONABLE;
		}

		/* Neither suspended jobs nor running jobs (inside or outside
		 * a resv) may be on a node which is to be provisioned
		 */
		if (node->num_susp_jobs > 0 || node->num_jobs > 0) {
			set_schd_error_codes(err, NOT_RUN, PROV_RESRESV_CONFLICT);
			return NOT_PROVISIONABLE;
		}
	}

	/* node cannot be shared between running reservation without AOE
	 * and job with AOE
	 */
	if (resresv->is_job && node->run_resvs_arr) {
		for (int r = 0; node->run_resvs_arr[r]; r++) {
			if (node->run_resvs_arr[r]->aoename != NULL)
				continue;

			set_schd_error_codes(err, NOT_RUN, PROV_RESRESV_CONFLICT);
			return NOT_PROVISIONABLE;
		}
	}

	/* node cannot be shared between running job with AOE
	 * and reservation without AOE
	 */
	if (resresv->is_resv && resresv->aoename == NULL && node->job_arr) {
		for (int jb = 0; node->job_arr[jb]; jb++) {
			if (node->job_arr[jb]->aoename == NULL)
				continue;

			set_schd_error_codes(err, NOT_RUN, PROV_RESRESV_CONFLICT);
			return NOT_PROVISIONABLE;
		}
	}

	return result;
}

/**
 * @brief
 *		handles everything which happens to a node when it comes back up
 *
 * @param[in]	node	-	the node to bring back up
 * @param[in]	arg		-	unused
 *
 * @par Side Effects:
 * 		The node's state is set to resv-exclusive if it had that state
 * 		set before, otherwise to free.  The server's placement sets are
 * 		updated and re-sorted when node grouping is enabled with a key, and
 * 		update_all_nodepart() is called for the server.
 *
 * @par MT-safe:	Unknown
 *
 * @return	int
 * @retval	1 - node was successfully brought up
 * @retval	0 - node is NULL
 *
 */
int
node_up_event(node_info *node, void *arg)
{
	if (node == NULL)
		return 0;

	/* anything but a previously resv-exclusive node comes back as free */
	if (!node->is_resv_exclusive)
		set_node_info_state(node, ND_free);
	else
		set_node_info_state(node, ND_resv_exclusive);

	server_info *srv = node->server;
	const bool grouping_on = srv->node_group_enable && !srv->node_group_key.empty();

	if (grouping_on) {
		node_partition_update_array(srv->policy, srv->nodepart);
		qsort(srv->nodepart, srv->num_parts,
		      sizeof(node_partition *), cmp_placement_sets);
	}
	update_all_nodepart(srv->policy, srv, NO_ALLPART);

	return 1;
}

/**
 * @brief
 *		handles everything which happens to a node when it goes down
 *
 * @param[in]	node	-	node to bring down
 * @param[in]	arg		-	unused
 *
 * @par Side Effects:
 *		update_universe_on_end() is called for every job on the node,
 *		with state "Q" if the job can be requeued and "X" if not.  The
 *		node's state is set to down.  The server's placement sets are
 *		updated and re-sorted when node grouping is enabled with a key, and
 *		update_all_nodepart() is called for the server.
 * @par MT-safe: Unknown
 *
 * @return	int
 * @retval	1	: node was successfully brought down
 * @retval	0	: node is NULL
 *
 */
int
node_down_event(node_info *node, void *arg)
{
	if (node == NULL)
		return 0;

	server_info *srv = node->server;

	if (node->job_arr != NULL) {
		for (int j = 0; node->job_arr[j] != NULL; j++) {
			auto running = node->job_arr[j];
			/* requeue-able jobs go back to queued, the rest are ended */
			const char *end_state = running->job->can_requeue ? "Q" : "X";

			update_universe_on_end(srv->policy, running, end_state, NO_ALLPART);
		}
	}

	set_node_info_state(node, ND_down);

	const bool grouping_on = srv->node_group_enable && !srv->node_group_key.empty();
	if (grouping_on) {
		node_partition_update_array(srv->policy, srv->nodepart);
		qsort(srv->nodepart, srv->num_parts,
		      sizeof(node_partition *), cmp_placement_sets);
	}
	update_all_nodepart(srv->policy, srv, NO_ALLPART);

	return 1;
}

/**
 * @brief
 *		create an array of unique nodes from the names in a string array
 *
 * @param[in]	nodes	-	nodes to create array from
 * @param[in]	strnodes	-	NULL terminated string array of vnode names
 *
 * @note
 *		A name which is not found in nodes is logged and skipped.  Only the
 *		array is allocated here; its entries point into nodes.
 *
 * @return	node array (NULL terminated)
 * @retval	NULL	: nodes or strnodes is NULL, or memory could not be allocated
 *
 */
node_info **
create_node_array_from_str(node_info **nodes, char **strnodes)
{
	if (nodes == NULL || strnodes == NULL)
		return NULL;

	const int num_names = count_array(strnodes);

	auto ninfo_arr = static_cast<node_info **>(malloc((num_names + 1) * sizeof(node_info *)));
	if (ninfo_arr == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return NULL;
	}
	ninfo_arr[0] = NULL;

	int used = 0; /* index of the terminator, i.e. the next free slot */
	for (int s = 0; strnodes[s] != NULL; s++) {
		/* name was already collected by an earlier entry */
		if (find_node_info(ninfo_arr, strnodes[s]) != NULL)
			continue;

		/* a miss stores NULL in the slot, which keeps the array terminated */
		ninfo_arr[used] = find_node_info(nodes, strnodes[s]);
		if (ninfo_arr[used] == NULL) {
			log_eventf(PBSEVENT_DEBUG2, PBS_EVENTCLASS_NODE, LOG_DEBUG, __func__,
				   "Node %s not found in list.", strnodes[s]);
			continue;
		}

		used++;
		ninfo_arr[used] = NULL;
	}

	return ninfo_arr;
}

/**
 * @brief find the first node with a given rank in a NULL terminated array
 *	  and return its index
 * @param ninfo_arr - node array
 * @param rank - rank of node to search for
 * @return int
 * @retval 0+ - index in array of node
 * @retval -1 - node not found or ninfo_arr is NULL
 */
int
find_node_ind(node_info **ninfo_arr, int rank)
{
	if (ninfo_arr == NULL)
		return -1;

	for (int idx = 0; ninfo_arr[idx] != NULL; idx++) {
		if (ninfo_arr[idx]->rank == rank)
			return idx;
	}

	/* reached the terminator without a match */
	return -1;
}

/**
 * @brief
 * 		find a node by its unique rank
 *
 * @param[in]	ninfo_arr	-	NULL terminated node array to search
 * @param[in] rank	-	unique numeric identifier for node
 *
 * @return	node_info *
 * @retval	found node
 * @retval	NULL	: if node is not found or ninfo_arr is NULL
 */
node_info *
find_node_by_rank(node_info **ninfo_arr, int rank)
{
	if (ninfo_arr == NULL)
		return NULL;

	/* find_node_ind() does the search and reports -1 for "not found" */
	const int pos = find_node_ind(ninfo_arr, rank);
	if (pos != -1)
		return ninfo_arr[pos];

	return NULL;
}

/**
 * @brief find a node by indexing into sinfo->unordered_nodes O(1) or
 * 	  by searching for its unique rank O(N) if sinfo->unordered_nodes is unavailable
 *
 * @param[in] ninfo_arr - array of nodes to search.  Its first node supplies
 *			  the server whose unordered_nodes array is indexed
 * @param[in] ind - index into sinfo->unordered_nodes.  A negative value
 *		    means the index is unknown and forces the search by rank
 * @param[in] rank - node's unique rank
 *
 * @note ind is not checked against the size of unordered_nodes; the caller
 *	 must pass an index which is valid for that array
 *
 * @return node_info *
 * @retval found node
 * @retval NULL if node is not found, or if ninfo_arr is NULL or empty
 */
node_info *
find_node_by_indrank(node_info **ninfo_arr, int ind, int rank)
{
	if (ninfo_arr == NULL || ninfo_arr[0] == NULL)
		return NULL;

	server_info *sinfo = ninfo_arr[0]->server;

	/* without a usable index or an unordered_nodes array to index into,
	 * fall back to the linear search by rank
	 */
	if (ind < 0 || sinfo == NULL || sinfo->unordered_nodes == NULL)
		return find_node_by_rank(ninfo_arr, rank);

	return sinfo->unordered_nodes[ind];
}

/**
 * @brief
 * 		determine if resresv conflicts based on exclhost state of the
 *		future events on this node.
 *
 * @param	calendar - server's calendar of events
 * @param	resresv  - job or resv to check
 * @param	ninfo    - node to check
 *
 * @note
 *		The simulation runs over TIMED_RUN_EVENT events up to the end time of
 *		resresv.  When duration and hard_duration differ and
 *		exists_resv_event() reports a reservation event up to
 *		server_time + hard_duration, the end time is computed with
 *		calc_time_left(resresv, 1), otherwise with calc_time_left(resresv, 0).
 *		NOTE(review): exists_resv_event() is assumed to take an absolute
 *		time like every other time in this function - confirm.
 *
 * @return int
 * @retval 1	: no excl conflict (also returned if any argument is NULL)
 * @retval 0	: future excl conflict
 */
int
sim_exclhost(event_list *calendar, resource_resv *resresv, node_info *ninfo)
{
	time_t end;

	if (calendar == NULL || resresv == NULL || ninfo == NULL)
		return 1;

	const auto now = resresv->server->server_time;

	/* calendar events carry absolute times, so the hard duration has to be
	 * turned into an absolute time before it is compared against them
	 */
	if (resresv->duration != resresv->hard_duration &&
	    exists_resv_event(calendar, now + resresv->hard_duration))
		end = now + calc_time_left(resresv, 1);
	else
		end = now + calc_time_left(resresv, 0);

	return generic_sim(calendar, TIMED_RUN_EVENT,
			   end, 1, sim_exclhost_func, (void *) resresv, (void *) ninfo);
}
/**
 * @brief
 * 		helper function for generic_sim() to check if an event has an exclhost
 *	  conflict with a job/resv on a node.  We either find a conflict or
 *	  continue looping.
 *
 * @param[in]	te	-	future event; its event_ptr is used as a resource_resv
 * @param[in]	arg1	-	job/reservation (resource_resv *)
 * @param[in]	arg2	-	node (node_info *)
 *
 * @return	int
 * @retval	0	: continue looping (any argument is NULL, the event does
 *			  not use the node, or there is no exclhost conflict)
 * @retval	-1	: excl conflict
 */
int
sim_exclhost_func(timed_event *te, void *arg1, void *arg2)
{
	if (te == NULL || arg1 == NULL || arg2 == NULL)
		return 0;

	auto requestor = static_cast<resource_resv *>(arg1);
	auto target_node = static_cast<node_info *>(arg2);
	auto upcoming = static_cast<resource_resv *>(te->event_ptr);

	/* event does not affect the node */
	if (find_nspec_by_rank(upcoming->nspec_arr, target_node->rank) == NULL)
		return 0;

	/* it is a conflict if either side wants the whole host to itself */
	const bool conflict = is_exclhost(upcoming->place_spec, target_node->sharing) ||
			      is_exclhost(requestor->place_spec, target_node->sharing);

	return conflict ? -1 : 0;
}

/**
 * @brief
 * 		set current_aoe on a node.  The existing value is freed and the
 *		node stores its own copy of the new one.
 *
 * @param[in]	node	-	node to set (nothing is done if NULL)
 * @param[in]	aoe	-	aoe to set on node; NULL clears the value
 *
 * @return void
 */
void
set_current_aoe(node_info *node, char *aoe)
{
	if (node == NULL)
		return;

	/* free() accepts NULL, so an unset value needs no special case */
	free(node->current_aoe);
	node->current_aoe = (aoe != NULL) ? string_dup(aoe) : NULL;
}

/**
 * @brief set current_eoe on a node.  The existing value is freed and the
 *	  node stores its own copy of the new one.
 * @param[in] node - node to set (nothing is done if NULL)
 * @param[in] eoe - eoe to set on node; NULL clears the value
 * @return void
 */
void
set_current_eoe(node_info *node, char *eoe)
{
	if (node == NULL)
		return;

	/* free() accepts NULL, so an unset value needs no special case */
	free(node->current_eoe);

	char *eoe_copy = NULL;
	if (eoe != NULL)
		eoe_copy = string_dup(eoe);
	node->current_eoe = eoe_copy;
}

/**
 * @brief
 * 		should we exclhost this job - a function of node sharing and job place
 *
 * @param[in]	pl	-	job place attribute
 * @param[in]	sharing	-	the node's sharing attribute value
 *
 * @return	int
 * @retval	1	: do exclhost
 * @retval	0	: don't do exclhost (or pl is NULL and the node doesn't
 *			  force exclhost)
 */
int
is_exclhost(place *pl, enum vnode_sharing sharing)
{
	/* a node which forces exclhost wins regardless of the place */
	if (sharing == VNS_FORCE_EXCLHOST)
		return 1;

	/* a node which ignores exclusiveness, or a missing place, means no exclhost */
	if (sharing == VNS_IGNORE_EXCL || pl == NULL)
		return 0;

	/* the job asks for exclhost itself */
	if (pl->exclhost)
		return 1;

	/* the node defaults to exclhost and the job asks for neither excl nor share */
	const bool dflt_applies = sharing == VNS_DFLT_EXCLHOST &&
				  pl->excl == 0 && pl->share == 0;

	return dflt_applies ? 1 : 0;
}

/**
 * @brief	pthread routine to check eligibility for a chunk of nodes
 *
 * @par Functionality:
 *		Every node of data->ninfo_arr in the index range
 *		[data->sidx, data->eidx] (the scan also stops at the array's NULL
 *		terminator) whose nscr is still 0 is run through
 *		is_vnode_eligible().  A node which fails is marked
 *		NSCR_INELIGIBLE.  If such a node belongs to a hostset and there is
 *		an exclhost conflict, every node of the hostset is marked
 *		ineligible as well.
 *
 * @param[in,out]	data - th_data_nd_eligible object.  On success data->err
 *			is set to a newly allocated schd_error holding the first
 *			error reported for a node of the chunk (or no error).
 *			data->err is not touched if data is NULL or if memory
 *			can not be allocated.
 *
 * @return void
 */
void
check_node_eligibility_chunk(th_data_nd_eligible *data)
{
	int i;
	int start, end;
	schd_error *err;
	schd_error *misc_err;
	resource_resv *resresv;
	place *pl;
	node_info **ninfo_arr;

	if (data == NULL)
		return;

	err = new_schd_error();
	if (err == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		return;
	}
	misc_err = new_schd_error();
	if (misc_err == NULL) {
		log_err(errno, __func__, MEM_ERR_MSG);
		/* err was allocated successfully above; release it before bailing out */
		free_schd_error(err);
		return;
	}

	start = data->sidx;
	end = data->eidx;
	resresv = data->resresv;
	pl = data->pl;
	ninfo_arr = data->ninfo_arr;

	for (i = start; i <= end && ninfo_arr[i] != NULL; i++) {
		node_info *node;

		node = ninfo_arr[i];
		/* nodes which already carry a scratch flag are not re-evaluated */
		if (!node->nscr) {
			if (is_vnode_eligible(node, resresv, pl, err) == 0) {
				node->nscr |= NSCR_INELIGIBLE;
				if (node->hostset != NULL) {
					/* an exclhost conflict, now or with a future event,
					 * rules out the whole host
					 */
					if ((err->error_code == NODE_NOT_EXCL && is_exclhost(pl, node->sharing)) || sim_exclhost(resresv->server->calendar, resresv, node) == 0) {
						int j;

						for (j = 0; node->hostset->ninfo_arr[j] != NULL; j++) {
							node_info *n = node->hostset->ninfo_arr[j];
							n->nscr |= NSCR_INELIGIBLE;
							/* misc_err is only borrowed for logging here
							 * and cleared again right away
							 */
							set_schd_error_codes(misc_err, NOT_RUN, NODE_NOT_EXCL);
							schdlogerr(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG, n->name,
								   NULL, misc_err);
							clear_schd_error(misc_err);
						}
					}
				}
				if (err->status_code != SCHD_UNKWN) {
					/* keep the first real error for the caller */
					if (misc_err->status_code == SCHD_UNKWN)
						copy_schd_error(misc_err, err);
					schdlogerr(PBSEVENT_DEBUG3, PBS_EVENTCLASS_NODE, LOG_DEBUG, node->name, NULL, err);
				}
				clear_schd_error(err);
			}
		}
	}

	free_schd_error(err);
	/* ownership of misc_err passes to whoever consumes data */
	data->err = misc_err;
}

/**
 * @brief	 Allocates th_data_nd_eligible for multi-threading of check_node_array_eligibility
 *
 * @param[in]	pl	-	the placement object
 * @param[in]	resresv	-	resresv to check to place on nodes
 * @param[in]	ninfo_arr	-	array to check
 * @param[in]	sidx	-	the start index in ninfo_arr for the thread
 * @param[in]	eidx	-	the end index in ninfo_arr for the thread
 *
 * @return th_data_nd_eligible *
 * @retval a newly allocated th_data_nd_eligible object holding the arguments,
 *	   with its err member set to NULL
 * @retval NULL for malloc error
 */
static inline th_data_nd_eligible *
alloc_tdata_nd_eligible(place *pl, resource_resv *resresv, node_info **ninfo_arr,
			int sidx, int eidx)
{
	auto td = static_cast<th_data_nd_eligible *>(malloc(sizeof(th_data_nd_eligible)));

	if (td != NULL) {
		/* inputs of the eligibility check */
		td->ninfo_arr = ninfo_arr;
		td->sidx = sidx;
		td->eidx = eidx;
		td->resresv = resresv;
		td->pl = pl;
		/* output, filled in by the check */
		td->err = NULL;
		return td;
	}

	log_err(errno, __func__, MEM_ERR_MSG);
	return NULL;
}

/**
 * @brief
 * 		check nodes for eligibility and mark them ineligible if not
 *
 * @par Functionality:
 *		The check is done in the calling thread if it is a worker thread
 *		(thread id != 0) or if num_threads is <= 1.  Otherwise the array is
 *		split into chunks of at least MT_CHUNK_SIZE_MIN nodes which are
 *		queued for the worker threads, and the results are collected
 *		from result_queue.
 *
 * @param[in]	ninfo_arr	-	NULL terminated array to check
 * @param[in]	resresv	-	resresv to check to place on nodes
 * @param[in]	pl	-	the placement object
 * @param[out]	err	-	error structure
 *
 * @warning
 * 		If an error occurs in this function, no indication will be returned.
 *		This is not a huge concern because, it will just cause more work to be done.
 *
 * @return	void
 */
void
check_node_array_eligibility(node_info **ninfo_arr, resource_resv *resresv, place *pl, schd_error *err)
{
	th_data_nd_eligible *tdata = NULL;
	th_task_info *task = NULL;
	int tid;
	int num_nodes;

	if (ninfo_arr == NULL || resresv == NULL || pl == NULL || err == NULL)
		return;

	num_nodes = count_array(ninfo_arr);

	tid = *((int *) pthread_getspecific(th_id_key));
	if (tid != 0 || num_threads <= 1) {
		/* don't use multi-threading if I am a worker thread or num_threads is 1 */
		tdata = alloc_tdata_nd_eligible(pl, resresv, ninfo_arr, 0, num_nodes - 1);
		if (tdata == NULL)
			return;
		check_node_eligibility_chunk(tdata);
		/* tdata->err stays NULL if the check could not allocate its error objects */
		if (tdata->err != NULL) {
			copy_schd_error(err, tdata->err);
			free_schd_error(tdata->err);
		}
		free(tdata);
	} else { /* We are multithreading */
		int j;
		int num_tasks;
		int chunk_size = num_nodes / num_threads;
		chunk_size = (chunk_size > MT_CHUNK_SIZE_MIN) ? chunk_size : MT_CHUNK_SIZE_MIN;
		/* the last chunk may reach past the end of the array; the chunk
		 * check stops at the NULL terminator
		 */
		for (j = 0, num_tasks = 0; num_nodes > 0;
		     num_tasks++, j += chunk_size, num_nodes -= chunk_size) {
			tdata = alloc_tdata_nd_eligible(pl, resresv, ninfo_arr, j, j + chunk_size - 1);
			if (tdata == NULL)
				break;

			task = static_cast<th_task_info *>(malloc(sizeof(th_task_info)));
			if (task == NULL) {
				free(tdata);
				log_err(errno, __func__, MEM_ERR_MSG);
				break;
			}
			task->task_type = TS_IS_ND_ELIGIBLE;
			task->thread_data = (void *) tdata;

			queue_work_for_threads(task);
		}

		/* Get results from worker threads */
		for (int i = 0; i < num_tasks;) {
			pthread_mutex_lock(&result_lock);
			while (ds_queue_is_empty(result_queue))
				pthread_cond_wait(&result_cond, &result_lock);
			while (!ds_queue_is_empty(result_queue)) {
				task = static_cast<th_task_info *>(ds_dequeue(result_queue));
				tdata = static_cast<th_data_nd_eligible *>(task->thread_data);
				/* a task whose check could not allocate memory reports no error object */
				if (tdata->err != NULL) {
					/* the first error reported by any task is the one returned */
					if (err->status_code == SCHD_UNKWN && tdata->err->status_code != SCHD_UNKWN)
						copy_schd_error(err, tdata->err);

					free_schd_error(tdata->err);
				}
				free(tdata);
				free(task);
				i++;
			}
			pthread_mutex_unlock(&result_lock);
		}
	}
}

/**
 * @brief
 *	node_in_partition	-  Tells whether the given node belongs to this scheduler
 *
 * @par Functionality:
 *	For the default scheduler (dflt_sched is set) a node belongs to the
 *	scheduler if it has no partition.  Otherwise the node's partition has
 *	to be equal to the partition given.
 *
 * @param[in]	ninfo		-  node information
 * @param[in]	partition	-  partition associated to scheduler.  It is
 *				   not looked at for the default scheduler
 *
 *
 * @return	int
 * @retval	1	: the node belongs to this scheduler
 * @retval	0	: it does not, or ninfo is NULL, or a partition is
 *			  needed for the comparison but is NULL
 */
int
node_in_partition(node_info *ninfo, char *partition)
{
	if (ninfo == NULL)
		return 0;

	/* the default scheduler handles exactly the nodes without a partition */
	if (dflt_sched)
		return (ninfo->partition == NULL) ? 1 : 0;

	/* strcmp() must not be handed a NULL pointer */
	if (ninfo->partition == NULL || partition == NULL)
		return 0;

	return (strcmp(partition, ninfo->partition) == 0) ? 1 : 0;
}

/**
 * @brief add an event to all the nodes associated to a calendar event.
 *	  Each node's node_events list is kept ordered by event time; the new
 *	  event is placed after the existing events with the same event time.
 * @param te - event
 * @param nspecs - nspecs[i]->ninfo is the node to add the event to
 * @return bool
 * @retval true success
 * @retval false te is NULL or a list element could not be allocated.  Nodes
 *		 handled before the failed allocation keep the event.
 */
bool
add_event_to_nodes(timed_event *te, std::vector<nspec *> &nspecs)
{
	if (te == NULL)
		return false;

	for (auto ns : nspecs) {
		te_list *pre_tel = NULL;
		te_list *cur_tel;
		te_list *tel = new_te_list();

		if (tel == NULL)
			return false;
		tel->event = te;

		/* pre_tel ends up as the last element which is not later than te */
		for (cur_tel = ns->ninfo->node_events; cur_tel != NULL && cur_tel->event->event_time <= te->event_time; cur_tel = cur_tel->next)
			pre_tel = cur_tel;

		if (pre_tel != NULL) {
			/* link the rest of the list behind the new element first so
			 * that the later events are not lost
			 */
			tel->next = pre_tel->next;
			pre_tel->next = tel;
		} else {
			/* earlier than everything on the list (or the list is empty) */
			tel->next = ns->ninfo->node_events;
			ns->ninfo->node_events = tel;
		}
	}
	return true;
}

/**
 * @brief function pointer argument to generic_sim() to add an event to the
 *	  nodes of the resource_resv the event refers to.  Disabled events
 *	  are skipped.
 * @param te - event; its event_ptr is used as a resource_resv
 * @param arg1 - unused
 * @param arg2 - unused
 * @return @see generic_sim()
 * @retval 0 - continue looping (also for a NULL or disabled event)
 * @retval -1 - the event could not be added to the nodes
 */
int
add_node_events(timed_event *te, void *arg1, void *arg2)
{
	if (te == NULL || te->disabled)
		return 0;

	auto resresv = static_cast<resource_resv *>(te->event_ptr);
	if (resresv == NULL)
		return 0;

	/* bind by reference: the node list is only read, there is no need to
	 * copy the whole vector for every event
	 */
	auto &nspecs = resresv->nspec_arr;

	if (!add_event_to_nodes(te, nspecs))
		return -1;

	return 0;
}