static stepd_step_rec_t * _step_setup(slurm_addr_t *cli, slurm_addr_t *self, slurm_msg_t *msg) { stepd_step_rec_t *job = NULL; switch (msg->msg_type) { case REQUEST_BATCH_JOB_LAUNCH: debug2("setup for a batch_job"); job = mgr_launch_batch_job_setup(msg->data, cli); break; case REQUEST_LAUNCH_TASKS: debug2("setup for a launch_task"); job = mgr_launch_tasks_setup(msg->data, cli, self, msg->protocol_version); break; default: fatal("handle_launch_message: Unrecognized launch RPC"); break; } if (!job) { error("_step_setup: no job returned"); return NULL; } job->jmgr_pid = getpid(); job->jobacct = jobacctinfo_create(NULL); /* Establish GRES environment variables */ if (conf->debug_flags & DEBUG_FLAG_GRES) { gres_plugin_job_state_log(job->job_gres_list, job->jobid); gres_plugin_step_state_log(job->step_gres_list, job->jobid, job->stepid); } if (msg->msg_type == REQUEST_BATCH_JOB_LAUNCH) gres_plugin_job_set_env(&job->env, job->job_gres_list, 0); else if (msg->msg_type == REQUEST_LAUNCH_TASKS) gres_plugin_step_set_env(&job->env, job->step_gres_list, 0); /* * Add slurmd node topology informations to job env array */ env_array_overwrite(&job->env,"SLURM_TOPOLOGY_ADDR", conf->node_topo_addr); env_array_overwrite(&job->env,"SLURM_TOPOLOGY_ADDR_PATTERN", conf->node_topo_pattern); set_msg_node_id(job); return job; }
/* * main - slurmctld main function, start various threads and process RPCs * test7.17.prog <TRES_PER_NODE> <CONFIG_DIR_HEAD> <CONFIG_SUB_DIR> <CPU_COUNT> * */ int main(int argc, char *argv[]) { log_options_t opts = LOG_OPTS_STDERR_ONLY; int rc; uint32_t cpu_count, cpu_alloc, job_id = 12345; char *node_name, *reason_down = NULL; char *orig_config, *new_config = NULL, *tres_per_node = NULL; Buf buffer; List job_gres_list = NULL, node_gres_list = NULL; bitstr_t *cpu_bitmap; char config_dir[10000], test[1000]; char slurm_conf[1000]; uint32_t num_tasks = 1; uint32_t min_nodes = 1; uint32_t max_nodes = 1; uint16_t ntasks_per_node = NO_VAL16; uint16_t ntasks_per_socket = NO_VAL16; uint16_t sockets_per_node = NO_VAL16; uint16_t cpus_per_task = NO_VAL16; int core_count, sock_count; /* Setup slurm.conf and gres.conf test paths */ strcpy(config_dir, argv[2]); strcpy(config_dir,strcat(config_dir, "/test7.17_configs")); strcpy(test, strcat(config_dir, argv[3])); strcpy(slurm_conf, strcat(test, "/slurm.conf")); /* Enable detailed logging for now */ opts.stderr_level = LOG_LEVEL_DEBUG; log_init(argv[0], opts, SYSLOG_FACILITY_USER, NULL); /* * Logic normally executed by slurmd daemon */ setenv("SLURM_CONF", slurm_conf, 1); rc = gres_plugin_init(); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_init"); exit(1); } setenv("SLURM_CONFIG_DIR", config_dir, 1); cpu_count = strtol(argv[4], NULL, 10); node_name = "test_node"; rc = gres_plugin_node_config_load(cpu_count, node_name, NULL, NULL, NULL); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_node_config_load"); exit(1); } buffer = init_buf(1024); rc = gres_plugin_node_config_pack(buffer); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_node_config_pack"); exit(1); } /* * Logic normally executed by slurmctld daemon */ orig_config = "gpu:8"; rc = gres_plugin_init_node_config(node_name, orig_config, &node_gres_list); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_init_node_config"); exit(1); } set_buf_offset(buffer, 0); rc = gres_plugin_node_config_unpack(buffer, node_name); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_node_config_unpack"); exit(1); } core_count = cpu_count; sock_count = 1; rc = gres_plugin_node_config_validate(node_name, orig_config, &new_config, &node_gres_list, cpu_count, core_count, sock_count, 0, &reason_down); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_node_config_validate"); exit(1); } if (argc > 2) tres_per_node = xstrdup(argv[1]); rc = gres_plugin_job_state_validate(NULL, /* cpus_per_tres */ NULL, /* tres_freq */ NULL, /* tres_per_job */ tres_per_node, NULL, /* tres_per_socket */ NULL, /* tres_per_task */ NULL, /* mem_per_tres */ &num_tasks, &min_nodes, &max_nodes, &ntasks_per_node, &ntasks_per_socket, &sockets_per_node, &cpus_per_task, &job_gres_list); if (rc != SLURM_SUCCESS) { slurm_seterrno(rc); slurm_perror("failure: gres_plugin_job_state_validate"); exit(1); } gres_plugin_node_state_log(node_gres_list, node_name); gres_plugin_job_state_log(job_gres_list, job_id); cpu_bitmap = bit_alloc(cpu_count); bit_nset(cpu_bitmap, 0, cpu_count - 1); cpu_alloc = gres_plugin_job_test(job_gres_list, node_gres_list, true, cpu_bitmap, 0, cpu_count - 1, job_id, node_name); if (cpu_alloc == NO_VAL) printf("cpu_alloc=ALL\n"); else printf("cpu_alloc=%u\n", cpu_alloc); rc = gres_plugin_fini(); if (rc != SLURM_SUCCESS) { slurm_perror("failure: gres_plugin_fini"); exit(1); } printf("Test %s ran to completion\n\n", argv[3]); exit(0); }