免费注册 查看新帖 |

Chinaunix

  平台 论坛 博客 文库
最近访问板块 发新帖
查看: 1148 | 回复: 0
打印 上一主题 下一主题

linux 1.0 内核注解 linux/fs/namei.c [复制链接]

论坛徽章:
0
跳转到指定楼层
1 [收藏(0)] [报告]
发表于 2009-05-07 13:26 |只看该作者 |倒序浏览
/********************************************
*Created By: 陶治江
*Date:       2009年5月3日21:35:49
********************************************/

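#include <asm/segment.h>
#include <linux/errno.h>
#include <linux/sched.h>
#include <linux/kernel.h>
#include <linux/string.h>
#include <linux/fcntl.h>
#include <linux/stat.h>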
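/*
 * Macro that yields the permission mask for an open flag: the string literal
 * "\000\004\002\006" is an anonymous constant character array that is simply
 * indexed by the access-mode bits of the flag.
 */
#define ACC_MODE(x) ("\000\004\002\006"[(x)&O_ACCMODE])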
/*
 * getname() - copy a user-space pathname into a freshly allocated kernel page.
 *
 * In order to reduce some races, while at the same time doing additional
 * checking and hopefully speeding things up, filenames are copied to the
 * kernel data space before they are used.
 *
 * filename: user-space address of the NUL-terminated name. It must be
 *           non-zero and below TASK_SIZE (the original annotation gives
 *           TASK_SIZE as 0xc0000000, i.e. the end of user space).
 * result:   receives the address of the kernel copy; release with putname().
 *
 * The name, including its terminator, may occupy at most one page.
 *
 * Returns 0 on success, or:
 *   -EFAULT        bad address, or the name runs up to TASK_SIZE unterminated
 *   -ENOENT        empty name (POSIX.1 2.4: an empty pathname is invalid)
 *   -ENOMEM        no free page
 *   -ENAMETOOLONG  no terminator found within the one-page limit
 * On the "unterminated" failures the page is freed again; *result has been
 * written by then and must not be used by the caller.
 */
int getname(const char * filename, char **result)
{
	unsigned long addr = (unsigned long) filename;
	unsigned long room, page;
	int overflow_err = -EFAULT;
	char *dst, ch;

	if (!addr || addr >= TASK_SIZE)
		return -EFAULT;

	/* Bytes available before either TASK_SIZE or the page limit is hit. */
	room = TASK_SIZE - addr;
	if (room > PAGE_SIZE) {
		room = PAGE_SIZE;
		overflow_err = -ENAMETOOLONG;
	}

	/* Reject the empty string before spending a page on it. */
	ch = get_fs_byte(filename++);
	if (!ch)
		return -ENOENT;

	page = __get_free_page(GFP_KERNEL);
	if (!page)
		return -ENOMEM;
	dst = (char *) page;
	*result = dst;

	/* Store the previous byte, fetch the next, stop at the terminator. */
	for (room--; room; room--) {
		*dst++ = ch;
		ch = get_fs_byte(filename++);
		if (!ch) {
			*dst = '\0';
			return 0;
		}
	}

	free_page(page);
	return overflow_err;
}
/*
 * putname() - release a pathname buffer obtained from getname().
 *
 * name: address of the page that holds the kernel copy of the name.
 */
void putname(char * name)
{
	unsigned long page = (unsigned long) name;

	free_page(page);
}
/*
 * permission() - check whether the current process may access an inode.
 *
 * inode: the inode being accessed.
 * mask:  requested access bits, compared against the low three mode bits.
 *
 * If the inode supplies its own permission operation the decision is
 * delegated to it entirely. Otherwise the owner bits are used when the
 * current effective uid owns the inode, the group bits when in_group_p()
 * accepts the inode's gid, and the "other" bits in every remaining case.
 *
 * Returns 1 when access is allowed (all requested bits are present, or
 * suser() is true) and 0 otherwise; a filesystem-specific operation returns
 * whatever it chooses.
 */
int permission(struct inode * inode,int mask)
{
	int bits = inode->i_mode;

	if (inode->i_op && inode->i_op->permission)
		return inode->i_op->permission(inode, mask);

	/* Shift the relevant rwx triplet down into the low three bits. */
	if (current->euid == inode->i_uid)
		bits >>= 6;
	else if (in_group_p(inode->i_gid))
		bits >>= 3;

	if ((bits & mask & 0007) == mask)
		return 1;
	return suser() ? 1 : 0;
}
/*
 * lookup() looks up one part of a pathname, using the fs-dependent
 * lookup operation of the directory. It also handles the special parents:
 * the process root and mount points.
 *
 * dir:    directory to search; may be NULL (gives -ENOENT).
 * name:   component name, not necessarily NUL-terminated.
 * len:    length of the component.
 * result: receives the inode found; set to NULL first.
 *
 * Search (execute) permission on a directory is required to traverse it.
 * The permission is evaluated on the directory passed in, before any
 * mount-point crossing.
 *
 * ".." is special in two ways:
 *   - at the process root it resolves to the root itself, and this early
 *     return does not consult the permission result;
 *   - at the root of a mounted filesystem the search moves to the directory
 *     the filesystem is mounted on (sb->s_covered), so that the parent is
 *     found in the covering filesystem. This matches the shell behaviour of
 *     "cd /home/f/o/taozhijiang/mydocument/.." ending in
 *     /home/f/o/taozhijiang.
 *
 * An empty component (as in "/usr/") resolves to dir itself.
 *
 * Returns 0 or the value of the directory's lookup operation on success
 * paths, -ENOENT, -ENOTDIR (no lookup operation) or -EACCES. On the
 * -ENOTDIR and -EACCES paths dir is released with iput().
 */
int lookup(struct inode * dir,const char * name, int len,
	struct inode ** result)
{
	struct super_block * sb;
	int may_search, is_dotdot, err;

	*result = NULL;
	if (!dir)
		return -ENOENT;

	/* check permissions before traversing mount-points */
	may_search = permission(dir,MAY_EXEC);

	is_dotdot = (len == 2 && name[0] == '.' && name[1] == '.');
	if (is_dotdot) {
		if (dir == current->root) {
			/* Already at the root: ".." stays where it is. */
			*result = dir;
			return 0;
		}
		sb = dir->i_sb;
		if (sb && dir == sb->s_mounted) {
			/* Step from the mounted root down to the covered directory. */
			iput(dir);
			dir = sb->s_covered;
			if (!dir)
				return -ENOENT;
			dir->i_count++;
		}
	}

	if (!dir->i_op || !dir->i_op->lookup)
		err = -ENOTDIR;
	else if (!may_search)
		err = -EACCES;
	else if (!len) {
		/* Trailing slash, e.g. "/usr/": the directory is the answer. */
		*result = dir;
		return 0;
	} else
		return dir->i_op->lookup(dir,name,len,result);

	iput(dir);
	return err;
}
/*
 * follow_link() - resolve inode through its follow_link operation, if any.
 *
 * dir:       directory the inode was found in.
 * inode:     inode that may be a link.
 * flag/mode: passed through unchanged to the inode's follow_link operation.
 * res_inode: receives the resulting inode (NULL when dir or inode is NULL).
 *
 * When the inode has no follow_link operation, dir is released and the inode
 * itself is returned. When either argument is NULL both are released and
 * -ENOENT is returned. Otherwise the result is whatever the inode's
 * follow_link operation returns.
 */
int follow_link(struct inode * dir, struct inode * inode,
	int flag, int mode, struct inode ** res_inode)
{
	if (dir && inode) {
		if (inode->i_op && inode->i_op->follow_link)
			return inode->i_op->follow_link(dir,inode,flag,mode,res_inode);

		/* Nothing to follow: hand the inode back as it is. */
		iput(dir);
		*res_inode = inode;
		return 0;
	}

	iput(dir);
	iput(inode);
	*res_inode = NULL;
	return -ENOENT;
}
/////
//这个文件中理解dir_namei namei的区别是很重要的
//dir_namei返回的是最底层的"目录"的节点信息,而其他的
//参数输出是该目录下的文件信息,而namei就是最底层的文件的信息了
////
//下面是论坛中的解释
/*
那么比如说 有一个pathname为  abc/def/ghi/jk
dir_namei返回的是ghi节点,文件名jk(不管jk是目录还是文件)和jk的长度.
namei 返回的是jk节点*/
/*
* dir_namei()
*
* dir_namei() returns the inode of the directory of the
* specified name, and the name within that directory.
*/
//返回指定目录的inode,并且返回该目录下的文件的长度和名字,而
//不管这个文件的类型(当然'/usr/')这样的路径参数就需要注意了!
static int dir_namei(const char * pathname, int * namelen, const char ** name,
struct inode * base, struct inode ** res_inode)
{
char c;
const char * thisname;
int len,error;
struct inode * inode;
*res_inode = NULL;
if (!base) {
  base = current->pwd;
  base->i_count++;
}
if ((c = *pathname) == '/') {  //从根目录开始遍寻
  iput(base);
  base = current->root;
  pathname++;   //移过 /
  base->i_count++;
}

while (1)
{
  thisname = pathname;  //提取单个目录名
  for(len=0;(c = *(pathname++))&&(c != '/');len++)
   /* nothing */ ;
  if (!c)  //此时len和pathname(thisname)的数据在参数返回
   break;
  base->i_count++;
  error = lookup(base,thisname,len,&inode);
  if (error) {
   iput(base);
   return error;
  }
  
  //估计的作用就是更新base节点
  error = follow_link(base,inode,0,0,&base);
  if (error)
   return error;
}

if (!base->i_op || !base->i_op->lookup) {
  iput(base);
  return -ENOTDIR;
}
*name = thisname;
*namelen = len;
*res_inode = base;
return 0;
}
/*
 * _namei() - resolve a kernel-space pathname to the inode of its last
 * component.
 *
 * pathname:     kernel-space pathname.
 * base:         starting directory, or NULL for the current directory.
 * follow_links: non-zero to pass the final inode through follow_link().
 * res_inode:    receives the inode; set to NULL first.
 *
 * Returns 0 on success or the error reported by dir_namei(), lookup() or
 * follow_link().
 */
static int _namei(const char * pathname, struct inode * base,
	int follow_links, struct inode ** res_inode)
{
	const char * last;
	int last_len,err;
	struct inode * found;

	*res_inode = NULL;
	err = dir_namei(pathname,&last_len,&last,base,&base);
	if (err)
		return err;

	base->i_count++;	/* lookup uses up base */
	err = lookup(base,last,last_len,&found);
	if (err) {
		iput(base);
		return err;
	}

	if (!follow_links) {
		iput(base);
	} else {
		/* follow_link() takes over the remaining reference to base. */
		err = follow_link(base,found,0,0,&found);
		if (err)
			return err;
	}
	*res_inode = found;
	return 0;
}
/*
 * lnamei() - like namei(), but the final component is not passed through
 * follow_link(); that flag is the only difference between the two.
 *
 * pathname:  user-space pathname.
 * res_inode: receives the inode on success.
 *
 * Returns 0 on success or the error from getname()/_namei().
 */
int lnamei(const char * pathname, struct inode ** res_inode)
{
	char * kname;
	int err = getname(pathname,&kname);

	if (err)
		return err;
	err = _namei(kname,NULL,0,res_inode);
	putname(kname);	/* give the name page back */
	return err;
}
/*
 * namei()
 *
 * is used by most simple commands to get the inode of a specified name.
 * Open, link etc use their own routines, but this is enough for things
 * like 'chmod' etc.
 *
 * The pathname is followed until a terminal point is found, with the final
 * component passed through follow_link().
 *
 * pathname:  user-space pathname.
 * res_inode: receives the inode on success.
 *
 * Returns 0 on success or the error from getname()/_namei().
 */
int namei(const char * pathname, struct inode ** res_inode)
{
	char * kname;
	int err = getname(pathname,&kname);

	if (err)
		return err;
	err = _namei(kname,NULL,1,res_inode);
	putname(kname);
	return err;
}
/*
* open_namei()
*
* namei for open - this is in fact almost the whole open-routine.
*
* Note that the low bits of "flag" aren't the same as in the open
* system call - they are 00 - no permissions needed
*     01 - read permission needed
*     10 - write permission needed
*     11 - read/write permissions needed
* which is a lot more logical, and also allows the "no perm" needed
* for symlinks (where the permissions are checked later).
*
* pathname:  kernel-space pathname to open.
* flag:      access bits as described above, plus O_CREAT/O_EXCL/O_TRUNC.
* mode:      creation mode; masked with S_IALLUGO and the process umask and
*            tagged S_IFREG before use.
* res_inode: receives the opened inode on success.
* base:      starting directory handed on to dir_namei().
*
* Returns 0 on success, otherwise a negative errno: the error from
* dir_namei()/lookup()/follow_link()/create()/notify_change(), or -EISDIR,
* -EACCES, -EEXIST, -EROFS, -ETXTBSY as produced below.
*/
int open_namei(const char * pathname, int flag, int mode,
struct inode ** res_inode, struct inode * base)
{
const char * basename;
int namelen,error;
struct inode * dir, *inode;
struct task_struct ** p;
mode &= S_IALLUGO & ~current->umask;
mode |= S_IFREG;  /* anything created here is a regular file */
error = dir_namei(pathname,&namelen,&basename,base,&dir);
if (error)
  return error;
if (!namelen) {   /* special case: '/usr/' etc */  
  if (flag & 2) {  /* write access requested on a directory */
   iput(dir);
   return -EISDIR;
  }
  /* thanks to Paul Pluzhnikov for noticing this was missing.. */
  if (!permission(dir,ACC_MODE(flag))) {
   iput(dir);
   return -EACCES;
  }
  *res_inode=dir;
  return 0;
}
dir->i_count++;  /* lookup eats the dir */

/* Creation requested? */
if (flag & O_CREAT) {
  down(&dir->i_sem);
  error = lookup(dir,basename,namelen,&inode);
  if (!error) { /* the file already exists */
   if (flag & O_EXCL) {  /* exclusive create: an existing file is an
                            error, so drop it and report -EEXIST */
    iput(inode);
    error = -EEXIST;
   }
  } else if (!permission(dir,MAY_WRITE | MAY_EXEC))
   error = -EACCES;
  else if (!dir->i_op || !dir->i_op->create)
   error = -EACCES;
  else if (IS_RDONLY(dir))
   error = -EROFS;
  else {
   dir->i_count++;  /* create eats the dir */
   error = dir->i_op->create(dir,basename,namelen,mode,res_inode);
   up(&dir->i_sem);
   iput(dir);
   return error;
  }
  up(&dir->i_sem);
} else  /* no creation: plain lookup of the final component */
  error = lookup(dir,basename,namelen,&inode);
  
if (error) {
  iput(dir);
  return error;
}
/* Resolve a possible link; follow_link() takes over dir from here on. */
error = follow_link(dir,inode,flag,mode,&inode);
if (error)
  return error;
if (S_ISDIR(inode->i_mode) && (flag & 2)) {  /* a directory may not be opened for writing */
  iput(inode);
  return -EISDIR;
}
if (!permission(inode,ACC_MODE(flag))) {
  iput(inode);
  return -EACCES;
}
if (S_ISBLK(inode->i_mode) || S_ISCHR(inode->i_mode)) {
  if (IS_NODEV(inode)) {  /* device special file where IS_NODEV() holds */
   iput(inode);
   return -EACCES;
  }
} else {
  if (IS_RDONLY(inode) && (flag & 2)) {
   iput(inode);
   return -EROFS;
  }
}
  /* The inode has other users and write access is wanted: scan the tasks
     from LAST_TASK down to (but excluding) FIRST_TASK for one that uses it
     as program text. */
  if ((inode->i_count > 1) && (flag & 2)) {
   for (p = &LAST_TASK ; p > &FIRST_TASK ; --p)
   {
          struct vm_area_struct * mpnt;
    if (!*p)
     continue;
   
    // pathname  refers to an executable image which is currently being
            // executed and write access was requested.
    if (inode == (*p)->executable) { /* the image this task is executing */
     iput(inode);
     return -ETXTBSY;
    }
   
   for(mpnt = (*p)->mmap; mpnt; mpnt = mpnt->vm_next) {
    if (mpnt->vm_page_prot & PAGE_RW) /* writable mapping: not a conflict */
     continue;
     
    /* non-writable mapping of this very inode */
    if (inode == mpnt->vm_inode) {
     iput(inode);
     return -ETXTBSY;
    }
   }
   }
  }
if (flag & O_TRUNC) {
       inode->i_size = 0;  /* truncate the file */
       if (inode->i_op && inode->i_op->truncate)
            inode->i_op->truncate(inode);
       if ((error = notify_change(NOTIFY_SIZE, inode))) {
     iput(inode);
     return error;
       }
       inode->i_dirt = 1;
}
*res_inode = inode;
return 0;
}
/*
 * do_mknod() - create a filesystem node for a kernel-space pathname.
 *
 * filename: kernel-space pathname of the node to create.
 * mode:     type and permission bits; the process umask is cleared from it.
 * dev:      device number handed to the filesystem.
 *
 * The parent directory must be on a writable filesystem, must grant write
 * and search permission, and must provide a mknod operation.
 *
 * Returns the result of the directory's mknod operation, or -ENOENT (empty
 * final component), -EROFS, -EACCES, -EPERM (no mknod operation), or the
 * error from dir_namei().
 */
int do_mknod(const char * filename, int mode, dev_t dev)
{
	const char * basename;
	int namelen, error;
	struct inode * dir;

	mode &= ~current->umask;
	error = dir_namei(filename,&namelen,&basename, NULL, &dir);
	if (error)
		return error;

	if (!namelen)
		error = -ENOENT;
	else if (IS_RDONLY(dir))
		error = -EROFS;
	else if (!permission(dir,MAY_WRITE | MAY_EXEC))
		error = -EACCES;
	else if (!dir->i_op || !dir->i_op->mknod)
		error = -EPERM;
	if (error) {
		iput(dir);
		return error;
	}

	/*
	 * down()/up() are the kernel semaphore P and V operations; i_sem is
	 * held around the directory modification.
	 *
	 * The mknod operation is expected to consume the reference obtained
	 * from dir_namei() (the original code never released dir after the
	 * call). Take a second reference so that dir is still pinned when
	 * up() touches dir->i_sem, exactly as open_namei() does around
	 * create(), and drop it afterwards.
	 */
	dir->i_count++;
	down(&dir->i_sem);
	error = dir->i_op->mknod(dir,basename,namelen,mode,dev);
	up(&dir->i_sem);
	iput(dir);
	return error;
}
/*
 * sys_mknod() - system call: make a directory entry for a special file.
 * Typically used for character devices, block devices and FIFOs.
 *
 * filename: user-space pathname.
 * mode:     type and permission bits. A mode without any type bits is
 *           treated as a regular file.
 * dev:      device number.
 *
 * Directories can never be created this way, and only the superuser may
 * create anything other than a FIFO (-EPERM). File types other than
 * regular, character, block and FIFO give -EINVAL. Otherwise returns the
 * error from getname() or the result of do_mknod().
 */
asmlinkage int sys_mknod(const char * filename, int mode, dev_t dev)
{
	char * kname;
	int err;

	if (S_ISDIR(mode))
		return -EPERM;
	if (!S_ISFIFO(mode) && !suser())
		return -EPERM;

	/* Validate the file-type field of the mode. */
	switch (mode & S_IFMT) {
	case S_IFREG:
	case S_IFCHR:
	case S_IFBLK:
	case S_IFIFO:
		break;
	case 0:
		mode |= S_IFREG;
		break;
	default:
		return -EINVAL;
	}

	err = getname(filename,&kname);
	if (err)
		return err;
	err = do_mknod(kname,mode,dev);
	putname(kname);
	return err;
}
static int do_mkdir(const char * pathname, int mode)
{
const char * basename;
int namelen, error;
struct inode * dir;
error = dir_namei(pathname,&namelen,&basename,NULL,&dir);
if (error)
  return error;
if (!namelen) {
  iput(dir);
  return -ENOENT;
}
if (IS_RDONLY(dir)) {
  iput(dir);
  return -EROFS;
}
if (!permission(dir,MAY_WRITE | MAY_EXEC)) {  //记住,创建目录就需要有目录的写和执行权限
  iput(dir);
  return -EACCES;
}
if (!dir->i_op || !dir->i_op->mkdir) {
  iput(dir);
  return -EPERM;
}
down(&dir->i_sem);
error = dir->i_op->mkdir(dir,basename,namelen,mode);
up(&dir->i_sem);
return error;
}
/*
 * sys_mkdir() - system call: create a directory.
 *
 * pathname: user-space pathname.
 * mode:     mode passed on to do_mkdir().
 *
 * Returns the error from getname() or the result of do_mkdir().
 */
asmlinkage int sys_mkdir(const char * pathname, int mode)
{
	char * kname;
	int err = getname(pathname,&kname);

	if (err)
		return err;
	err = do_mkdir(kname,mode);
	putname(kname);
	return err;
}
static int do_rmdir(const char * name)
{
const char * basename;
int namelen, error;
struct inode * dir;
error = dir_namei(name,&namelen,&basename,NULL,&dir);
if (error)
  return error;
if (!namelen) {
  iput(dir);
  return -ENOENT;
}
if (IS_RDONLY(dir)) {
  iput(dir);
  return -EROFS;
}
if (!permission(dir,MAY_WRITE | MAY_EXEC)) {
  iput(dir);
  return -EACCES;
}
if (!dir->i_op || !dir->i_op->rmdir) {
  iput(dir);
  return -EPERM;
}
return dir->i_op->rmdir(dir,basename,namelen);
}
/*
 * sys_rmdir() - system call: remove a directory.
 *
 * pathname: user-space pathname.
 *
 * Returns the error from getname() or the result of do_rmdir().
 */
asmlinkage int sys_rmdir(const char * pathname)
{
	char * kname;
	int err = getname(pathname,&kname);

	if (err)
		return err;
	err = do_rmdir(kname);
	putname(kname);
	return err;
}
static int do_unlink(const char * name)
{
const char * basename;
int namelen, error;
struct inode * dir;
error = dir_namei(name,&namelen,&basename,NULL,&dir);
if (error)
  return error;
if (!namelen) {
  iput(dir);
  return -EPERM;
}
if (IS_RDONLY(dir)) {
  iput(dir);
  return -EROFS;
}
if (!permission(dir,MAY_WRITE | MAY_EXEC)) {
  iput(dir);
  return -EACCES;
}
if (!dir->i_op || !dir->i_op->unlink) {
  iput(dir);
  return -EPERM;
}
return dir->i_op->unlink(dir,basename,namelen);
}
/*
 * sys_unlink() - system call: remove a directory entry.
 *
 * pathname: user-space pathname.
 *
 * Returns the error from getname() or the result of do_unlink().
 */
asmlinkage int sys_unlink(const char * pathname)
{
	char * kname;
	int err = getname(pathname,&kname);

	if (err)
		return err;
	err = do_unlink(kname);
	putname(kname);
	return err;
}
//符号连接(软连接)
static int do_symlink(const char * oldname, const char * newname)
{
struct inode * dir;
const char * basename;
int namelen, error;
error = dir_namei(newname,&namelen,&basename,NULL,&dir);
if (error)
  return error;
if (!namelen) {
  iput(dir);
  return -ENOENT;
}
if (IS_RDONLY(dir)) {
  iput(dir);
  return -EROFS;
}
if (!permission(dir,MAY_WRITE | MAY_EXEC)) {
  iput(dir);
  return -EACCES;
}
if (!dir->i_op || !dir->i_op->symlink) {
  iput(dir);
  return -EPERM;
}
down(&dir->i_sem);
error = dir->i_op->symlink(dir,basename,namelen,oldname);
up(&dir->i_sem);
return error;
}
/*
 * sys_symlink() - system call: create a symbolic link.
 *
 * oldname: user-space string the link will point at.
 * newname: user-space pathname of the link to create.
 *
 * Both strings are copied into kernel space with getname(), so both must be
 * valid, non-empty names. Only newname is resolved, by do_symlink().
 *
 * Returns the error from either getname() or the result of do_symlink().
 */
asmlinkage int sys_symlink(const char * oldname, const char * newname)
{
	char * from, * to;
	int err;

	err = getname(oldname,&from);
	if (err)
		return err;

	err = getname(newname,&to);
	if (!err) {
		err = do_symlink(from,to);
		putname(to);
	}
	putname(from);
	return err;
}
//硬链接
static int do_link(struct inode * oldinode, const char * newname)
{
struct inode * dir;
const char * basename;
int namelen, error;
error = dir_namei(newname,&namelen,&basename,NULL,&dir);
if (error) {
  iput(oldinode);
  return error;
}
if (!namelen) {
  iput(oldinode);
  iput(dir);
  return -EPERM;
}
if (IS_RDONLY(dir)) {
  iput(oldinode);
  iput(dir);
  return -EROFS;
}

//呃,硬链接的限制了,同一个设备(文件系统?)
if (dir->i_dev != oldinode->i_dev) {
  iput(dir);
  iput(oldinode);
  return -EXDEV;
}
if (!permission(dir,MAY_WRITE | MAY_EXEC)) {
  iput(dir);
  iput(oldinode);
  return -EACCES;
}
if (!dir->i_op || !dir->i_op->link) {
  iput(dir);
  iput(oldinode);
  return -EPERM;
}
down(&dir->i_sem);
error = dir->i_op->link(oldinode, dir, basename, namelen);
up(&dir->i_sem);
return error;
}
/*
 * sys_link() - system call: create a hard link.
 *
 * oldname: user-space pathname of the existing file; resolved with namei().
 * newname: user-space pathname of the new entry.
 *
 * Returns the error from namei() or getname(), or the result of do_link().
 * The inode obtained for oldname is released here if newname cannot be
 * copied in; otherwise it is passed on to do_link().
 */
asmlinkage int sys_link(const char * oldname, const char * newname)
{
	struct inode * oldinode;
	char * to;
	int err;

	err = namei(oldname, &oldinode);
	if (err)
		return err;

	err = getname(newname,&to);
	if (!err) {
		err = do_link(oldinode,to);
		putname(to);
		return err;
	}
	iput(oldinode);
	return err;
}
static int do_rename(const char * oldname, const char * newname)
{
struct inode * old_dir, * new_dir;
const char * old_base, * new_base;
int old_len, new_len, error;
error = dir_namei(oldname,&old_len,&old_base,NULL,&old_dir);
if (error)
  return error;
if (!permission(old_dir,MAY_WRITE | MAY_EXEC)) {
  iput(old_dir);
  return -EACCES;
}

//特殊的,就是. 和 .. 不能被重新命令的
if (!old_len || (old_base[0] == '.' &&
     (old_len == 1 || (old_base[1] == '.' &&
      old_len == 2)))) {
  iput(old_dir);
  return -EPERM;
}

error = dir_namei(newname,&new_len,&new_base,NULL,&new_dir);
if (error) {
  iput(old_dir);
  return error;
}
if (!permission(new_dir,MAY_WRITE | MAY_EXEC)) {
  iput(old_dir);
  iput(new_dir);
  return -EACCES;
}
if (!new_len || (new_base[0] == '.' &&
     (new_len == 1 || (new_base[1] == '.' &&
      new_len == 2)))) {
  iput(old_dir);
  iput(new_dir);
  return -EPERM;
}
if (new_dir->i_dev != old_dir->i_dev) {  //这个是肯定的
  iput(old_dir);
  iput(new_dir);
  return -EXDEV;
}
if (IS_RDONLY(new_dir) || IS_RDONLY(old_dir)) {
  iput(old_dir);
  iput(new_dir);
  return -EROFS;
}
if (!old_dir->i_op || !old_dir->i_op->rename) {
  iput(old_dir);
  iput(new_dir);
  return -EPERM;
}
down(&new_dir->i_sem);  //调用原先节点的rename函数
error = old_dir->i_op->rename(old_dir, old_base, old_len,
  new_dir, new_base, new_len);
up(&new_dir->i_sem);
return error;
}
/*
 * sys_rename() - system call: rename a directory entry.
 *
 * oldname: user-space pathname of the existing entry.
 * newname: user-space pathname of the new entry.
 *
 * Returns the error from either getname() or the result of do_rename().
 */
asmlinkage int sys_rename(const char * oldname, const char * newname)
{
	char * from, * to;
	int err;

	err = getname(oldname,&from);
	if (err)
		return err;

	err = getname(newname,&to);
	if (!err) {
		err = do_rename(from,to);
		putname(to);
	}
	putname(from);
	return err;
}

文档地址:
http://blogimg.chinaunix.net/blog/upfile2/090503233213.pdf


本文来自ChinaUnix博客,如果查看原文请点:http://blog.chinaunix.net/u3/90306/showart_1921144.html
您需要登录后才可以回帖 登录 | 注册

本版积分规则 发表回复

  

北京盛拓优讯信息技术有限公司. 版权所有 京ICP备16024965号-6 北京市公安局海淀分局网监中心备案编号:11010802020122 niuxiaotong@pcpop.com 17352615567
未成年举报专区
中国互联网协会会员  联系我们:huangweiwei@itpub.net
感谢所有关心和支持过ChinaUnix的朋友们 转载本站内容请注明原作者名及出处

清除 Cookies - ChinaUnix - Archiver - WAP - TOP