- 论坛徽章:
- 0
|
这个是我以前写的, 你看看
使用shm 作为监视进程, 监视另一个进程运行, 如果被监视进程异常退出, 则重启被监视进程
步骤:
1. 由监视进程启动被监视进程 monitor ./app app_argv_0 app_argv_1, monitor最好是daemon形式
2. app 通过 open-> ftok-> shmget-> shmat 建立shm并写入预定内容
3. monitor 等待 app稳定
4. monitor 通过 ftok-> shmget-> shmat 读取shm 内容并比较,
如果app运行正常则清空shm, 重复第四步, 否则跳至第一步
#include <sys/types.h>
#include <sys/stat.h>
#include <fcntl.h>
#include <sys/ipc.h>
#include <sys/shm.h>
#include <sys/types.h>
#include <unistd.h>
#include <stdio.h>
#include <signal.h>
#include <sys/wait.h>
//===================================
// defined in common.h
typedef struct {
int magic;
} wd_msg_t;
#define WD_MSG_FILE_KEY "/dev/shm/myshm2"
#define WD_MSG_MAGIC_NUM 0x12348765
#define WD_MSG_SHM_SIZE 256
//===================================
static void sigint_handler(int sig);
static void shm_wd_uninit(void);
static void exec_app(char* app, char** argv);
static wd_msg_t *p_msg = NULL;
static int shm_id;
static int exit_flg = 0;
static pid_t pid_app = 0;
//monitor ./app app_argv_0 app_argv_1
int main(int argc, char** argv)
{
key_t key;
char* name = WD_MSG_FILE_KEY;
int i;
char* store_argv[128];
char* store_app;
int fd;
if (argc < 2)
return 0;
//store parameter
store_app = argv[1];
for (i = 2; i < argc; i++)
{
store_argv[i - 2] = argv[i];
}
store_argv[i - 2] = NULL;
// SIGINT
struct sigaction act, oldact;
act.sa_handler = sigint_handler;
sigemptyset(&act.sa_mask);
act.sa_flags = 0;
sigaction(SIGINT, &act, &oldact);
// create shm
fd = open(name, O_RDWR|O_CREAT, S_IRUSR | S_IWUSR);
if (fd == -1)
perror("open error");
key = ftok(name,0);
if (key==-1)
perror("ftok error");
shm_id=shmget(key, WD_MSG_SHM_SIZE ,IPC_CREAT|IPC_EXCL|0666 );
if (shm_id==-1)
{
perror("MONITOR shmget error");
return 0;
}
p_msg=(wd_msg_t*)shmat(shm_id,NULL,0);
if ((int)p_msg == -1)
{
perror("MONITOR shmat error");
return 0;
}
exec_app(store_app, store_argv);
int err_cnt = 0;
int status;
while (1)
{
if (p_msg->magic == WD_MSG_MAGIC_NUM)
{
err_cnt = 0;
printf("===ok===\n");
p_msg->magic = 0;
}
else
{
printf("===error===\n");
if (++err_cnt >= 3)
{
// kill app & restart
if (pid_app > 0)
{
kill( pid_app,SIGKILL );
waitpid( pid_app, &status, WNOHANG ); // obtain information about the child
}
exec_app(store_app, store_argv);
}
}
sleep(2);
if (exit_flg)
break;
}
shm_wd_uninit();
return 0;
}
static void sigint_handler(int sig)
{
printf("===end===\n");
exit_flg = 1;
}
static void shm_wd_uninit(void)
{
if (shmdt(p_msg)==-1)
perror("MONITOR detach error ");
shmctl( shm_id, IPC_RMID, NULL );
}
static void exec_app(char* app, char** argv)
{
int status;
pid_app = fork();
if (pid_app == -1) /* fork出错 */
{
perror("MONITOR fork error ");
}
else if (pid_app == 0) /* fork返回0表示处于子进程 */
{
printf("In child process!!\n My PID is %d\n",getpid());
execv(app, argv);
}
else
{
puts( "in parent" );
waitpid( pid_app, &status, WNOHANG );
}
}
|
|
|