/* * Registers for process death messages for the specified process name * This will be used by the mxosrvrs and mxocfg process'es to register * for mxoas death messages, instead of polling every 15 seconds to * check if the mxoas process is still around */ bool RegisterProcessDeathMessage(char *processName) { int ferr; // file system errors int nid; // node id int pid; // process id ferr = msg_mon_get_process_info(processName,&nid,&pid); if(ferr != XZFIL_ERR_OK || nid == -1 || pid == -1) return false; ferr = msg_mon_register_death_notification(nid, pid); if(ferr != XZFIL_ERR_OK) return false; } /* RegisterProcessDeathMessage() */
bool is_backup() { int ferr; MS_Mon_Process_Info_Type proc_info; ferr = msg_mon_get_process_info_detail(gname, &proc_info); TEST_CHK_FEOK(ferr); gnid = proc_info.nid; gpid = proc_info.pid; bool backup = proc_info.backup ? true : false; if (backup) { ferr = msg_mon_register_death_notification(proc_info.parent_nid, proc_info.parent_pid); assert(ferr == XZFIL_ERR_OK); } return backup; }
bool pp_is_backup() { bool backup; int disable; int ferr; MS_Mon_Node_Info_Type node_info; MS_Mon_Process_Info_Type proc_info; ferr = msg_mon_get_process_info_detail(gname, &proc_info); TEST_CHK_FEOK(ferr); gnid = proc_info.nid; gpid = proc_info.pid; backup = proc_info.backup ? true : false; if (backup) { gpeer_nid = proc_info.parent_nid; gpeer_pid = proc_info.parent_pid; // set this up in case register fails strcpy(gdisplay_name, gname); sprintf(&gdisplay_name[strlen(gdisplay_name)], "-%d-%d-%d-B", gnid, gpid, getpid()); if (gverbosepp) pp_printf("we are the backup process.\n"); disable = msg_test_assert_disable(); ferr = msg_mon_register_death_notification(gpeer_nid, gpeer_pid); if (ferr != XZFIL_ERR_OK) { if (gverbosepp) pp_printf("msg_mon_register_death_notification FAILED ferr=%d.\n", ferr); ferr = msg_mon_get_node_info_detail(gpeer_nid, &node_info); myassert(ferr == XZFIL_ERR_OK); if (gverbosepp) pp_printf("node-state=%d.\n", node_info.node[0].state); if (node_info.node[0].state == MS_Mon_State_Shutdown) gshutdown = true; } msg_test_assert_enable(disable); } return backup; }
int main(int argc, char *argv[]) { char cli[10]; bool closer; int disable; int event_len; int ferr; int inst = 0; int inx; int lerr; int loop = 10; int msgid; int nid; int oid; TPT_DECL (phandle); int pid; char recv_buffer[30000]; RT results; char send_buffer[10]; MS_SRE sre; TAD zargs[] = { { "-client", TA_Ign, TA_NOMAX, NULL }, { "-inst", TA_Int, TA_NOMAX, &inst }, { "-loop", TA_Int, TA_NOMAX, &loop }, { "-maxcp", TA_Int, TA_NOMAX, &maxcp }, { "-maxs", TA_Int, TA_NOMAX, &maxs }, { "-maxsp", TA_Next, TA_NOMAX, NULL }, { "-name", TA_Next, TA_NOMAX, NULL }, { "-server", TA_Ign, TA_NOMAX, NULL }, { "-v", TA_Bool, TA_NOMAX, &verbose }, { "", TA_End, TA_NOMAX, NULL } }; msfs_util_init(&argc, &argv, msg_debug_hook); arg_proc_args(zargs, false, argc, argv); util_test_start(true); ferr = msg_mon_process_startup(true); // system messages? TEST_CHK_FEOK(ferr); ferr = msg_mon_get_my_process_name(my_name, sizeof(my_name)); TEST_CHK_FEOK(ferr); msg_mon_enable_mon_messages(true); // process-wait for clients/shell // (needed so msg_mon_register_death_notification below works correctly) ferr = msfs_util_wait_process_count(MS_ProcessType_TSE, maxcp, NULL, false); TEST_CHK_FEOK(ferr); sleep(1); if (verbose) printf("%s: inst=%d, maxcp=%d\n", my_name, inst, maxcp); closer = (inst == (maxcp -1)); if (closer && (maxcp > 1)) { if (verbose) printf("%s: register-death-notifications\n", my_name); for (inx = 0; inx < (maxcp - 1); inx++) { sprintf(cli, "$c%d", inx); ferr = msg_mon_get_process_info(cli, &nid, &pid); TEST_CHK_FEOK(ferr); ferr = msg_mon_register_death_notification(nid, pid); TEST_CHK_FEOK(ferr); } } // // wait here until all clients sync-up // (needed so msg_mon_register_death_notification above works correctly) // ferr = msg_mon_event_send(-1, // nid -1, // pid MS_ProcessType_TSE, // process-type 3, // event-id 0, // event-len NULL); // event-data TEST_CHK_FEOK(ferr); for (inx = 0; inx < maxcp; inx++) { ferr = msg_mon_event_wait(3, &event_len, event_data); TEST_CHK_FEOK(ferr); } disable = msg_test_assert_disable(); // check process-type range ferr = msg_mon_event_send(-1, // nid -1, // pid -1, // process-type 4, // event-id 0, // event-len NULL); // event-data assert(ferr == XZFIL_ERR_BOUNDSERR); ferr = msg_mon_event_send(-1, // nid -1, // pid MS_ProcessType_SMS + 1, // process-type 5, // event-id 0, // event-len NULL); // event-data assert(ferr == XZFIL_ERR_BOUNDSERR); msg_test_assert_enable(disable); ferr = msg_mon_open_process((char *) "$srv", // name TPT_REF(phandle), &oid); TEST_CHK_FEOK(ferr); for (inx = 0; inx < loop; inx++) { ferr = XMSG_LINK_(TPT_REF(phandle), // phandle &msgid, // msgid NULL, // reqctrl 0, // reqctrlsize NULL, // replyctrl 0, // replyctrlmax send_buffer, // reqdata 1, // reqdatasize recv_buffer, // replydata 0, // replydatamax 0, // linkertag 0, // pri 0, // xmitclass 0); // linkopts util_check("XMSG_LINK_", ferr); ferr = XMSG_BREAK_(msgid, results.u.s, TPT_REF(phandle)); util_check("XMSG_BREAK_", ferr); } if (closer) { inx = 0; while (inx < (maxcp - 1)) { do { lerr = XWAIT(LREQ, -1); TEST_CHK_WAITIGNORE(lerr); lerr = XMSG_LISTEN_((short *) &sre, // sre 0, // listenopts 0); // listenertag } while (lerr == XSRETYPE_NOWORK); if (sre.sre_flags & XSRE_MON) { ferr = BMSG_READDATA_(sre.sre_msgId, // msgid recv_buffer, // reqdata BUFSIZ); // bytecount TEST_CHK_FEOK(ferr); MS_Mon_Msg *msg = (MS_Mon_Msg *) recv_buffer; if (msg->type == MS_MsgType_ProcessDeath) { if (verbose) printf("%s: process death process=%s\n", my_name, msg->u.death.process_name); inx++; } } XMSG_REPLY_(sre.sre_msgId, // msgid NULL, // replyctrl 0, // replyctrlsize recv_buffer, // replydata 0, // replydatasize 0, // errorclass NULL); // newphandle } if (verbose) printf("%s: sending stop\n", my_name); for (inx = 0; inx < maxs; inx++) { ferr = XMSG_LINK_(TPT_REF(phandle), // phandle &msgid, // msgid NULL, // reqctrl 0, // reqctrlsize NULL, // replyctrl 0, // replyctrlmax send_buffer, // reqdata 0, // reqdatasize recv_buffer, // replydata 0, // replydatamax 0, // linkertag 0, // pri 0, // xmitclass 0); // linkopts util_check("XMSG_LINK_", ferr); ferr = XMSG_BREAK_(msgid, results.u.s, TPT_REF(phandle)); util_check("XMSG_BREAK_", ferr); } } ferr = msg_mon_close_process(TPT_REF(phandle)); TEST_CHK_FEOK(ferr); ferr = msg_mon_process_shutdown(); TEST_CHK_FEOK(ferr); util_test_finish(true); return 0; }
int main(int argc, char *argv[]) { int exit; int ferr; bool ldone; int lerr; int msgid; int nid; int oid; int pid; TPT_DECL (phandle); char recv_buffer[BUFSIZ]; short recv_buffer2[BUFSIZ]; RT results; MS_SRE sre; MS_Mon_Transid_Type transid; ferr = msfs_util_init_role(true, &argc, &argv, msg_debug_hook); TEST_CHK_FEOK(ferr); util_test_start(true); ferr = msg_mon_process_startup(true); // system messages TEST_CHK_FEOK(ferr); msg_mon_enable_mon_messages(true); ferr = msg_mon_get_process_info((char *) "$srv", &nid, &pid); TEST_CHK_FEOK(ferr); ferr = msg_mon_open_process((char *) "$srv", // name TPT_REF(phandle), &oid); TEST_CHK_FEOK(ferr); TRANSID_SET_NULL(transid); ferr = msg_mon_deregister_death_notification(nid, pid, transid); TEST_CHK_FEOK(ferr); ferr = msg_mon_register_death_notification(nid, pid); TEST_CHK_FEOK(ferr); ferr = XMSG_LINK_(TPT_REF(phandle), // phandle &msgid, // msgid NULL, // reqctrl 0, // reqctrlsize recv_buffer2, // replyctrl 1, // replyctrlmax NULL, // reqdata 0, // reqdatasize recv_buffer, // replydata BUFSIZ, // replydatamax 0, // linkertag 0, // pri 0, // xmitclass XMSG_LINK_LDONEQ); // linkopts util_check("XMSG_LINK_", ferr); exit = 0; ldone = false; while (!exit) { do { lerr = XWAIT(LREQ|LDONE, -1); TEST_CHK_WAITIGNORE(lerr); if (lerr == LDONE) { ldone = true; break; } lerr = XMSG_LISTEN_((short *) &sre, // sre 0, // listenopts 0); // listenertag } while (lerr == XSRETYPE_NOWORK); if (ldone) { printf("LINK done\n"); lerr = XMSG_LISTEN_((short *) &sre, // sre XLISTEN_ALLOW_LDONEM, // listenopts 0); // listenertag assert(lerr == XSRETYPE_LDONE); ferr = XMSG_BREAK_(sre.sre_msgId, results.u.s, TPT_REF(phandle)); assert(ferr == XZFIL_ERR_OK); break; } ferr = XMSG_READDATA_(sre.sre_msgId, // msgid recv_buffer, // reqdata BUFSIZ); // bytecount util_check("XMSG_READDATA_", ferr); if (sre.sre_flags & XSRE_MON) { MS_Mon_Msg *msg = (MS_Mon_Msg *) recv_buffer; printf("cli: mon message, type=%d\n", msg->type); if (msg->type == MS_MsgType_ProcessDeath) { assert(msg->u.death.nid == nid); assert(msg->u.death.pid == pid); exit = 1; } else if (msg->type == MS_MsgType_Shutdown) { printf("cli: received cluster shutdown, level=%d\n", msg->u.shutdown.level); assert(msg->u.shutdown.level==MS_Mon_ShutdownLevel_Immediate); } } else printf("cli: NON-mon message\n"); XMSG_REPLY_(sre.sre_msgId, // msgid NULL, // replyctrl 0, // replyctrlsize NULL, // replydata 0, // replydatasize 0, // errorclass NULL); // newphandle } ferr = msg_mon_process_shutdown(); TEST_CHK_FEOK(ferr); util_test_finish(true); return 0; }