《linux 内核完全剖析》 exit.c 代码分析笔记
时间:2014-05-07 23:35:51
收藏:0
阅读:576
exit.c 代码分析笔记
release
释放进程的函数release() 主要根据指定进程的任务数据结构指针,在任务数组中删除指定的进程指针,释放相关内存页,并立刻让内核重新调度进程的运行。
void release(struct task_struct * p) //释放p指向的进程 { int i; if (!p) //常规检测p是否为0 return; if (p == current) { //不能把自己给释放了 printk("task releasing itself\n\r"); return; } for (i=1 ; i<NR_TASKS ; i++) //扫描所有的进程 if (task[i]==p) { //找出p进程 task[i]=NULL; //把p置空 /* Update links */ if (p->p_osptr) //调整链表 p->p_osptr->p_ysptr = p->p_ysptr; if (p->p_ysptr) p->p_ysptr->p_osptr = p->p_osptr; else p->p_pptr->p_cptr = p->p_osptr; free_page((long)p); //释放p进程占用的内存页 schedule();//任务调度 return; } panic("trying to release non-existent task"); }
bad_task_ptr 和audit_ptree
#ifdef DEBUG_PROC_TREE //下面这部分代码是调试用的 /* * Check to see if a task_struct pointer is present in the task[] array * Return 0 if found, and 1 if not found. */ int bad_task_ptr(struct task_struct *p) { int i; if (!p) return 0; for (i=0 ; i<NR_TASKS ; i++) if (task[i] == p) return 0; return 1; //如果p不在task数组里面,那这个指针就有问题! } /* * This routine scans the pid tree and make sure the rep invarient still * holds. Used for debugging only, since it‘s very slow.... * * It looks a lot scarier than it really is.... we‘re doing ?nothing more * than verifying the doubly-linked list found?in p_ysptr and p_osptr, * and checking it corresponds with the process tree defined by p_cptr and * p_pptr; */ void audit_ptree() //其实不难,就是打印进程树的相关信息,方便调试用 { int i; for (i=1 ; i<NR_TASKS ; i++) { if (!task[i]) continue; if (bad_task_ptr(task[i]->p_pptr)) printk("Warning, pid %d‘s parent link is bad\n", task[i]->pid); if (bad_task_ptr(task[i]->p_cptr)) printk("Warning, pid %d‘s child link is bad\n", task[i]->pid); if (bad_task_ptr(task[i]->p_ysptr)) printk("Warning, pid %d‘s ys link is bad\n", task[i]->pid); if (bad_task_ptr(task[i]->p_osptr)) printk("Warning, pid %d‘s os link is bad\n", task[i]->pid); if (task[i]->p_pptr == task[i]) printk("Warning, pid %d parent link points to self\n"); if (task[i]->p_cptr == task[i]) printk("Warning, pid %d child link points to self\n"); if (task[i]->p_ysptr == task[i]) printk("Warning, pid %d ys link points to self\n"); if (task[i]->p_osptr == task[i]) printk("Warning, pid %d os link points to self\n"); if (task[i]->p_osptr) { if (task[i]->p_pptr != task[i]->p_osptr->p_pptr) printk( "Warning, pid %d older sibling %d parent is %d\n", task[i]->pid, task[i]->p_osptr->pid, task[i]->p_osptr->p_pptr->pid); if (task[i]->p_osptr->p_ysptr != task[i]) printk( "Warning, pid %d older sibling %d has mismatched ys link\n", task[i]->pid, task[i]->p_osptr->pid); } if (task[i]->p_ysptr) { if (task[i]->p_pptr != task[i]->p_ysptr->p_pptr) printk( "Warning, pid %d younger sibling %d parent is %d\n", task[i]->pid, task[i]->p_osptr->pid, task[i]->p_osptr->p_pptr->pid); if (task[i]->p_ysptr->p_osptr != task[i]) printk( "Warning, pid %d younger sibling %d has mismatched os link\n", task[i]->pid, task[i]->p_ysptr->pid); } if (task[i]->p_cptr) { if (task[i]->p_cptr->p_pptr != task[i]) printk( "Warning, pid %d youngest child %d has mismatched parent link\n", task[i]->pid, task[i]->p_cptr->pid); if (task[i]->p_cptr->p_ysptr) printk( "Warning, pid %d youngest child %d has non-NULL ys link\n", task[i]->pid, task[i]->p_cptr->pid); } } } #endif /* DEBUG_PROC_TREE */
send_sig
static inline int send_sig(long sig,struct task_struct * p,int priv) //给进程p,发送信号。priv 是强制发送信号的标识 { if (!p) //常规的p非空检测 return -EINVAL; if (!priv && (current->euid!=p->euid) && !suser()) //如果不具有超级用户权限,又不是当前session里面的进程,且没有强制发送信号,进入if,return return -EPERM; if ((sig == SIGKILL) || (sig == SIGCONT)) { //如果要发送的信号是SIGKILL或者SIGCONT if (p->state == TASK_STOPPED) //如果当前进程处于stop状态,则将其置于TASK_RUNNING状态 p->state = TASK_RUNNING; p->exit_code = 0; p->signal &= ~( (1<<(SIGSTOP-1)) | (1<<(SIGTSTP-1)) | (1<<(SIGTTIN-1)) | (1<<(SIGTTOU-1)) ); //消除SIGSTOP SIGTSTP SIGTTIN SIGTTOU } /* If the signal will be ignored, don‘t even post it */ if ((int) p->sigaction[sig-1].sa_handler == 1) //如果handler是 ignore 就不要送信号鸟。。 return 0; /* Depends on order SIGSTOP, SIGTSTP, SIGTTIN, SIGTTOU */ if ((sig >= SIGSTOP) && (sig <= SIGTTOU)) //如果信号含有 SIGSTOP, SIGTSTP, SIGTTIN, SIGTTOU其中任何信号,那么就消除SIGCONT信号 p->signal &= ~(1<<(SIGCONT-1)); /* Actually deliver the signal */ p->signal |= (1<<(sig-1)); //最后这里才把信号写入信号变量 return 0; }
session_of_pgrp
int session_of_pgrp(int pgrp) //获取process group的session ID ,没有找到返回-1 { struct task_struct **p; for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) if ((*p)->pgrp == pgrp) return((*p)->session); return -1; }
kill_pg
int kill_pg(int pgrp, int sig, int priv) //给指定的进程组发送信号 { struct task_struct **p; int err,retval = -ESRCH; //指定的进程不存在 int found = 0; if (sig<1 || sig>32 || pgrp<=0) return -EINVAL; for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) if ((*p)->pgrp == pgrp) { //对每一个属于process group的进程发送信号sig if (sig && (err = send_sig(sig,*p,priv))) retval = err; else found++; } return(found ? 0 : retval); }
kill_proc
int kill_proc(int pid, int sig, int priv) //给指定进程发送信号 { struct task_struct **p; if (sig<1 || sig>32) return -EINVAL; for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) if ((*p)->pid == pid) return(sig ? send_sig(sig,*p,priv) : 0); return(-ESRCH); }
sys_kill
系统调用sys_kill 用于项进程发送任何指定的信号,根据参数pid不同的数值,该系统调用会向不同的进或进程组发送信号。
/* * POSIX specifies that kill(-1,sig) is unspecified, but what we have * is probably wrong. Should make it like BSD or SYSV. */ int sys_kill(int pid,int sig) { struct task_struct **p = NR_TASKS + task; int err, retval = 0; if (!pid) //如果是进程0 init ,用最高权限发送信号,将信号发送给当前进程所处进程组的所有进程 return(kill_pg(current->pid,sig,0)); if (pid == -1) { //如果 pid是-1,把信号发送到除了init进程外的所有进程! while (--p > &FIRST_TASK) if (err = send_sig(sig,*p,0)) retval = err; return(retval); } if (pid < 0) //如果pid<0,发送到|pid| 所处进程组的所有进程 return(kill_pg(-pid,sig,0)); /* Normal kill */ return(kill_proc(pid,sig,0)); //否则,发送到进程pid }
is_orphaned_pgrp
/* * Determine if a process group is "orphaned", according to the POSIX * definition in 2.2.2.52. Orphaned process groups are not to be affected * by terminal-generated stop signals. Newly orphaned process groups are * to receive a SIGHUP and a SIGCONT. * * "I ask you, have you ever known what it is to be an orphan?" */ int is_orphaned_pgrp(int pgrp) //判断是否为一个孤儿进程组 { struct task_struct **p; for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) { if (!(*p) || //如果进程不存在,下一个 ((*p)->pgrp != pgrp) || // 如果进程所处的进程组不是pgrp,下一个 ((*p)->state == TASK_ZOMBIE) || // 进程的状态是zombie,下一个 ((*p)->p_pptr->pid == 1)) //进程parent是init ,下一个 continue; if (((*p)->p_pptr->pgrp != pgrp) && //如果父进程所在的组不在pgrp,但是父进程所在的session存在 ((*p)->p_pptr->session == (*p)->session)) return 0; } return(1); /* (sighing) "Often!" */ }
has_stopped_jobs
static int has_stopped_jobs(int pgrp) //判断进程组内是否有进程处于TASK_STOPPED状态 { struct task_struct ** p; for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) { if ((*p)->pgrp != pgrp) continue; if ((*p)->state == TASK_STOPPED) return(1); } return(0); }
do_exit
volatile void do_exit(long code) { struct task_struct *p; int i; free_page_tables(get_base(current->ldt[1]),get_limit(0x0f)); free_page_tables(get_base(current->ldt[2]),get_limit(0x17)); /*这里采用的两个参数0x0f即1111B,因此他指向的段优先级为3,存储在LDT表中,索引为1。也就是当前任务段的代码段描述符。 另外一个参数0x17即10111B,因此他指向的段优先级为3,存储在LDT表中,索引为2.也就是当前任务的数及堆栈段描述符。 这样,通过get_limit(0x0f)和get_limit(0x17)就得到了当前任务代码段和数据堆栈段的长度。 因此, free_page_tables(get_base(current->ldt[1]),get_limit(0x0f)); free_page_tables(get_base(current->ldt[2]),get_limit(0x17));就释放了当前任务的代码段和数据堆栈段。*/ for (i=0 ; i<NR_OPEN ; i++) if (current->filp[i]) //filp文件结构指针表,filp[i]就是文件i被打开的ID sys_close(i); //关闭进程当前打开的文件 iput(current->pwd); //和fs inode有关系 current->pwd = NULL; //当前进程的工作目录置为NULL iput(current->root);//和fs inode有关系 current->root = NULL;//当前进程的根目录置为NULL iput(current->executable);//和fs inode有关系 current->executable = NULL;//当前进程的执行程序文件的i节点置为NULL iput(current->library);//和fs inode有关系 current->library = NULL;//当前进程的库文件置为NULL current->state = TASK_ZOMBIE; //状态置为TASK_ZOMBIE current->exit_code = code; //设置进程退出码 /* * Check to see if any process groups have become orphaned * as a result of our exiting, and if they have any stopped * jobs, send them a SIGUP and then a SIGCONT. (POSIX 3.2.2.2) * * Case i: Our father is in a different pgrp than we are * and we were the only connection outside, so our pgrp * is about to become orphaned. */ if ((current->p_pptr->pgrp != current->pgrp) && (current->p_pptr->session == current->session) && is_orphaned_pgrp(current->pgrp) && has_stopped_jobs(current->pgrp)) { //如果当前进程组是个orphaned group kill_pg(current->pgrp,SIGHUP,1); //用于只是这些进程和当前session 断开联系,我这里不是很明白为什么要发送SIGHUP 和 SIGCONT kill_pg(current->pgrp,SIGCONT,1); } /* Let father know we died */ current->p_pptr->signal |= (1<<(SIGCHLD-1)); // 告诉parent process 当前进程要挂掉鸟 /* * This loop does two things: * * A. Make init inherit all the child processes * B. Check to see if any process groups have become orphaned * as a result of our exiting, and if they have any stopped * jons, send them a SIGUP and then a SIGCONT. (POSIX 3.2.2.2) */ if (p = current->p_cptr) { //如果当前进程的child process 非空,进入if while (1) { p->p_pptr = task[1]; //让init进程领养current 进程的child 进程 if (p->state == TASK_ZOMBIE) //p进程沦为zombie task[1]->signal |= (1<<(SIGCHLD-1)); //向init进程发送SIGCHLD信号 /* * process group orphan check * Case ii: Our child is in a different pgrp * than we are, and it was the only connection * outside, so the child pgrp is now orphaned. */ if ((p->pgrp != current->pgrp) && (p->session == current->session) && is_orphaned_pgrp(p->pgrp) && has_stopped_jobs(p->pgrp)) { //判断p进程所在进程组是否是orphaned group,如果是。发送SIGHUP和SIGCONT信号 kill_pg(p->pgrp,SIGHUP,1); kill_pg(p->pgrp,SIGCONT,1); } if (p->p_osptr) { //如果p_osptr非空,则把p->p_osptr赋值给p p = p->p_osptr; continue; //下一轮循环,知道p_osptr为NULL } /* * This is it; link everything into init‘s children * and leave */ p->p_osptr = task[1]->p_cptr; task[1]->p_cptr->p_ysptr = p; task[1]->p_cptr = current->p_cptr; //这三句把这个child process —— p 更新为 init 进程的 最年轻的child process current->p_cptr = 0; //处理完所有的child process ,把 当前进程的p_cptr置为NULL break; //处理完了跳出while } } if (current->leader) { //如果当前进程是session leader struct task_struct **p; struct tty_struct *tty; if (current->tty >= 0) { //切断当前进程和terminal 的联系 tty = TTY_TABLE(current->tty); //tty 还没看布吉岛。。。 if (tty->pgrp>0) kill_pg(tty->pgrp, SIGHUP, 1); tty->pgrp = 0; tty->session = 0; } for (p = &LAST_TASK ; p > &FIRST_TASK ; --p) //把所有和当前进程同一个session的进程的tty都置为-1 if ((*p)->session == current->session) (*p)->tty = -1; } if (last_task_used_math == current) //数字协处理器木有看。。。布吉岛, //但是语句的意思是上次用过协处理器的进程是当前进程的话酒吧last_task_used_math 置为NULL last_task_used_math = NULL; #ifdef DEBUG_PROC_TREE audit_ptree(); #endif schedule(); //进程调度 }
sys_exit
int sys_exit(int error_code) //系统调用sys_exit函数,通过调用do_exit 函数来实现 { do_exit((error_code&0xff)<<8); //error_code是用户程序提供的退出状态信息,只有低字节有效 //把error_code 左移八位是空出第八位供wait()和waitpid()函数使用 }
sys_waitpid
用于挂起当前进程,知道pid指定的进程退出或者收到要求该进程终止的信号,或者是需要调用一个signal handler。如果pid 所指的进程早已退出(zombie)则本调用立刻返回。子进程的所有资源将被释放。
int sys_waitpid(pid_t pid,unsigned long * stat_addr, int options) //其实我一般都木有怎么用stat_addr 这边选项,一般我都NULL了 <—_<— //waitpid居然放在。。。exit.c 里,木有别的,只有惊奇 { int flag; struct task_struct *p; unsigned long oldblocked; verify_area(stat_addr,4); //验证stat_addr 地址处4byte 可写 repeat: flag=0; for (p = current->p_cptr ; p ; p = p->p_osptr) { if (pid>0) { if (p->pid != pid) //找到pid描述的child进程的指针 continue; } else if (!pid) { //如果pid等于0, 找到pid 所在的进程组 if (p->pgrp != current->pgrp) continue; } else if (pid != -1) { //如果pid < -1 ,找到|pid|所在的进程组 if (p->pgrp != -pid) continue; } // 如果以上判断田间都没进if去,pid = -1 ,这里不是很明白,看完fork之后回头再update switch (p->state) { case TASK_STOPPED: //如果进程p处于TASK_STOPPED状态 if (!(options & WUNTRACED) || //如果option的WUNTRACED 没有置位或者 exit_code 等于0 ,对下一个older child进行检测 !p->exit_code) continue; put_fs_long((p->exit_code << 8) | 0x7f, stat_addr);//把第一个参数写入第二个参数指向的地址 p->exit_code = 0; //正常退出 return p->pid; //返回结束child 的pid case TASK_ZOMBIE: current->cutime += p->utime; current->cstime += p->stime; //更新时间参数 flag = p->pid; put_fs_long(p->exit_code, stat_addr); //把p->exit_code 写入stat_addr release(p); //释放进程p占用的内存页 #ifdef DEBUG_PROC_TREE audit_ptree(); #endif return flag; default: flag=1; continue; } } if (flag) { //存在不处于TASK_STOPPED 和TASK_ZOMBIE状态的进程 if (options & WNOHANG) //如果WNOHANG(表示若没有子进程处于退出或者终止状态就返回)在options中置位,就立刻返回0; return 0; //一般我是不会用WNOHANG的。。。坦白的说我都没用过 current->state=TASK_INTERRUPTIBLE; //更新进程状态,置为TASK_INTERRUPTIBLE oldblocked = current->blocked; //当前进程阻塞的信号储存于oldblocked中 current->blocked &= ~(1<<(SIGCHLD-1)); //消除当前进程中的SIGCHLD信号 schedule();//进程调度 current->blocked = oldblocked; //回复原来的信号图 if (current->signal & ~(current->blocked | (1<<(SIGCHLD-1))))//如果收到了除了SIGCHLD之外的其他信号,return 挂掉 return -ERESTARTSYS; else goto repeat; //否则goto到repeat 继续重复,直到return 出去。。。。。原来是这样waitpid的啊! } return -ECHILD; //没有找到pid对应的child process,返回错误码 }
评论(0)