[CIFS] Fix spurious reconnect on 2nd peek from read of SMB length

[safe/jmp/linux-2.6] / fs / namei.c
diff --git a/fs/namei.c b/fs/namei.c

index 8c2db88..3b993db 100644 (file)
--- a/fs/namei.c
+++ b/fs/namei.c
@@ -22,7 +22,6 @@
  #include <linux/quotaops.h>
  #include <linux/pagemap.h>
  #include <linux/fsnotify.h>
-#include <linux/smp_lock.h>
  #include <linux/personality.h>
  #include <linux/security.h>
  #include <linux/syscalls.h>
@@ -31,7 +30,6 @@
  #include <linux/capability.h>
  #include <linux/file.h>
  #include <linux/fcntl.h>
-#include <linux/namei.h>
  #include <asm/namei.h>
  #include <asm/uaccess.h>
  
@@ -108,6 +106,8 @@
   * any extra contention...
   */
  
+static int fastcall link_path_walk(const char *name, struct nameidata *nd);
+
  /* In order to reduce some races, while at the same time doing additional
   * checking and hopefully speeding things up, we copy filenames to the
   * kernel data space before using them..
@@ -227,10 +227,14 @@ int generic_permission(struct inode *inode, int mask,
  
  int permission(struct inode *inode, int mask, struct nameidata *nd)
  {
-       umode_t mode = inode->i_mode;
         int retval, submask;
+       struct vfsmount *mnt = NULL;
+
+       if (nd)
+               mnt = nd->mnt;
  
         if (mask & MAY_WRITE) {
+               umode_t mode = inode->i_mode;
  
                 /*
                  * Nobody gets write access to a read-only fs.
@@ -246,22 +250,34 @@ int permission(struct inode *inode, int mask, struct nameidata *nd)
                         return -EACCES;
         }
  
-
-       /*
-        * MAY_EXEC on regular files requires special handling: We override
-        * filesystem execute permissions if the mode bits aren't set or
-        * the fs is mounted with the "noexec" flag.
-        */
-       if ((mask & MAY_EXEC) && S_ISREG(mode) && (!(mode & S_IXUGO) ||
-                       (nd && nd->mnt && (nd->mnt->mnt_flags & MNT_NOEXEC))))
-               return -EACCES;
+       if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode)) {
+               /*
+                * MAY_EXEC on regular files is denied if the fs is mounted
+                * with the "noexec" flag.
+                */
+               if (mnt && (mnt->mnt_flags & MNT_NOEXEC))
+                       return -EACCES;
+       }
  
         /* Ordinary permission routines do not understand MAY_APPEND. */
         submask = mask & ~MAY_APPEND;
-       if (inode->i_op && inode->i_op->permission)
+       if (inode->i_op && inode->i_op->permission) {
                 retval = inode->i_op->permission(inode, submask, nd);
-       else
+               if (!retval) {
+                       /*
+                        * Exec permission on a regular file is denied if none
+                        * of the execute bits are set.
+                        *
+                        * This check should be done by the ->permission()
+                        * method.
+                        */
+                       if ((mask & MAY_EXEC) && S_ISREG(inode->i_mode) &&
+                           !(inode->i_mode & S_IXUGO))
+                               return -EACCES;
+               }
+       } else {
                 retval = generic_permission(inode, submask, NULL);
+       }
         if (retval)
                 return retval;
  
@@ -297,7 +313,7 @@ int vfs_permission(struct nameidata *nd, int mask)
   */
  int file_permission(struct file *file, int mask)
  {
-       return permission(file->f_dentry->d_inode, mask, NULL);
+       return permission(file->f_path.dentry->d_inode, mask, NULL);
  }
  
  /*
@@ -333,7 +349,7 @@ int get_write_access(struct inode * inode)
  
  int deny_write_access(struct file * file)
  {
-       struct inode *inode = file->f_dentry->d_inode;
+       struct inode *inode = file->f_path.dentry->d_inode;
  
         spin_lock(&inode->i_lock);
         if (atomic_read(&inode->i_writecount) > 0) {
@@ -368,7 +384,7 @@ void path_release_on_umount(struct nameidata *nd)
   */
  void release_open_intent(struct nameidata *nd)
  {
-       if (nd->intent.open.file->f_dentry == NULL)
+       if (nd->intent.open.file->f_path.dentry == NULL)
                 put_filp(nd->intent.open.file);
         else
                 fput(nd->intent.open.file);
@@ -999,7 +1015,7 @@ return_err:
   * Retry the whole path once, forcing real lookup requests
   * instead of relying on the dcache.
   */
-int fastcall link_path_walk(const char *name, struct nameidata *nd)
+static int fastcall link_path_walk(const char *name, struct nameidata *nd)
  {
         struct nameidata save = *nd;
         int result;
@@ -1023,7 +1039,7 @@ int fastcall link_path_walk(const char *name, struct nameidata *nd)
         return result;
  }
  
-int fastcall path_walk(const char * name, struct nameidata *nd)
+static int fastcall path_walk(const char * name, struct nameidata *nd)
  {
         current->total_link_count = 0;
         return link_path_walk(name, nd);
@@ -1138,7 +1154,7 @@ static int fastcall do_path_lookup(int dfd, const char *name,
                 if (!file)
                         goto out_fail;
  
-               dentry = file->f_dentry;
+               dentry = file->f_path.dentry;
  
                 retval = -ENOTDIR;
                 if (!S_ISDIR(dentry->d_inode->i_mode))
@@ -1148,19 +1164,17 @@ static int fastcall do_path_lookup(int dfd, const char *name,
                 if (retval)
                         goto fput_fail;
  
-               nd->mnt = mntget(file->f_vfsmnt);
+               nd->mnt = mntget(file->f_path.mnt);
                 nd->dentry = dget(dentry);
  
                 fput_light(file, fput_needed);
         }
-       current->total_link_count = 0;
-       retval = link_path_walk(name, nd);
+
+       retval = path_walk(name, nd);
  out:
-       if (likely(retval == 0)) {
-               if (unlikely(!audit_dummy_context() && nd && nd->dentry &&
+       if (unlikely(!retval && !audit_dummy_context() && nd->dentry &&
                                 nd->dentry->d_inode))
-               audit_inode(name, nd->dentry->d_inode);
-       }
+               audit_inode(name, nd->dentry);
  out_fail:
         return retval;
  
@@ -1175,6 +1189,37 @@ int fastcall path_lookup(const char *name, unsigned int flags,
         return do_path_lookup(AT_FDCWD, name, flags, nd);
  }
  
+/**
+ * vfs_path_lookup - lookup a file path relative to a dentry-vfsmount pair
+ * @dentry:  pointer to dentry of the base directory
+ * @mnt: pointer to vfs mount of the base directory
+ * @name: pointer to file name
+ * @flags: lookup flags
+ * @nd: pointer to nameidata
+ */
+int vfs_path_lookup(struct dentry *dentry, struct vfsmount *mnt,
+                   const char *name, unsigned int flags,
+                   struct nameidata *nd)
+{
+       int retval;
+
+       /* same as do_path_lookup */
+       nd->last_type = LAST_ROOT;
+       nd->flags = flags;
+       nd->depth = 0;
+
+       nd->mnt = mntget(mnt);
+       nd->dentry = dget(dentry);
+
+       retval = path_walk(name, nd);
+       if (unlikely(!retval && !audit_dummy_context() && nd->dentry &&
+                               nd->dentry->d_inode))
+               audit_inode(name, nd->dentry);
+
+       return retval;
+
+}
+
  static int __path_lookup_intent_open(int dfd, const char *name,
                 unsigned int lookup_flags, struct nameidata *nd,
                 int open_flags, int create_mode)
@@ -1243,22 +1288,14 @@ int __user_path_lookup_open(const char __user *name, unsigned int lookup_flags,
         return err;
  }
  
-/*
- * Restricted form of lookup. Doesn't follow links, single-component only,
- * needs parent already locked. Doesn't follow mounts.
- * SMP-safe.
- */
-static struct dentry * __lookup_hash(struct qstr *name, struct dentry * base, struct nameidata *nd)
+static struct dentry *__lookup_hash(struct qstr *name,
+               struct dentry *base, struct nameidata *nd)
  {
-       struct dentry * dentry;
+       struct dentry *dentry;
         struct inode *inode;
         int err;
  
         inode = base->d_inode;
-       err = permission(inode, MAY_EXEC, nd);
-       dentry = ERR_PTR(err);
-       if (err)
-               goto out;
  
         /*
          * See if the low-level filesystem might want
@@ -1287,48 +1324,91 @@ out:
         return dentry;
  }
  
+/*
+ * Restricted form of lookup. Doesn't follow links, single-component only,
+ * needs parent already locked. Doesn't follow mounts.
+ * SMP-safe.
+ */
  static struct dentry *lookup_hash(struct nameidata *nd)
  {
+       int err;
+
+       err = permission(nd->dentry->d_inode, MAY_EXEC, nd);
+       if (err)
+               return ERR_PTR(err);
         return __lookup_hash(&nd->last, nd->dentry, nd);
  }
  
-/* SMP-safe */
-struct dentry * lookup_one_len(const char * name, struct dentry * base, int len)
+static int __lookup_one_len(const char *name, struct qstr *this,
+               struct dentry *base, int len)
  {
         unsigned long hash;
-       struct qstr this;
         unsigned int c;
  
-       this.name = name;
-       this.len = len;
+       this->name = name;
+       this->len = len;
         if (!len)
-               goto access;
+               return -EACCES;
  
         hash = init_name_hash();
         while (len--) {
                 c = *(const unsigned char *)name++;
                 if (c == '/' || c == '\0')
-                       goto access;
+                       return -EACCES;
                 hash = partial_name_hash(c, hash);
         }
-       this.hash = end_name_hash(hash);
+       this->hash = end_name_hash(hash);
+       return 0;
+}
+
+/**
+ * lookup_one_len:  filesystem helper to lookup single pathname component
+ * @name:      pathname component to lookup
+ * @base:      base directory to lookup from
+ * @len:       maximum length @len should be interpreted to
+ *
+ * Note that this routine is purely a helper for filesystem useage and should
+ * not be called by generic code.  Also note that by using this function to
+ * nameidata argument is passed to the filesystem methods and a filesystem
+ * using this helper needs to be prepared for that.
+ */
+struct dentry *lookup_one_len(const char *name, struct dentry *base, int len)
+{
+       int err;
+       struct qstr this;
  
+       err = __lookup_one_len(name, &this, base, len);
+       if (err)
+               return ERR_PTR(err);
+
+       err = permission(base->d_inode, MAY_EXEC, NULL);
+       if (err)
+               return ERR_PTR(err);
         return __lookup_hash(&this, base, NULL);
-access:
-       return ERR_PTR(-EACCES);
  }
  
-/*
- *     namei()
+/**
+ * lookup_one_noperm - bad hack for sysfs
+ * @name:      pathname component to lookup
+ * @base:      base directory to lookup from
   *
- * is used by most simple commands to get the inode of a specified name.
- * Open, link etc use their own routines, but this is enough for things
- * like 'chmod' etc.
+ * This is a variant of lookup_one_len that doesn't perform any permission
+ * checks.   It's a horrible hack to work around the braindead sysfs
+ * architecture and should not be used anywhere else.
   *
- * namei exists in two versions: namei/lnamei. The only difference is
- * that namei follows links, while lnamei does not.
- * SMP-safe
+ * DON'T USE THIS FUNCTION EVER, thanks.
   */
+struct dentry *lookup_one_noperm(const char *name, struct dentry *base)
+{
+       int err;
+       struct qstr this;
+
+       err = __lookup_one_len(name, &this, base, strlen(name));
+       if (err)
+               return ERR_PTR(err);
+       return __lookup_hash(&this, base, NULL);
+}
+
  int fastcall __user_walk_fd(int dfd, const char __user *name, unsigned flags,
                             struct nameidata *nd)
  {
@@ -1389,7 +1469,7 @@ static int may_delete(struct inode *dir,struct dentry *victim,int isdir)
                 return -ENOENT;
  
         BUG_ON(victim->d_parent->d_inode != dir);
-       audit_inode_child(victim->d_name.name, victim->d_inode, dir);
+       audit_inode_child(victim->d_name.name, victim, dir);
  
         error = permission(dir,MAY_WRITE | MAY_EXEC, NULL);
         if (error)
@@ -1528,10 +1608,6 @@ int may_open(struct nameidata *nd, int acc_mode, int flag)
         if (S_ISDIR(inode->i_mode) && (flag & FMODE_WRITE))
                 return -EISDIR;
  
-       error = vfs_permission(nd, acc_mode);
-       if (error)
-               return error;
-
         /*
          * FIFO's, sockets and device files are special: they don't
          * actually live on the filesystem itself, and as such you
@@ -1546,6 +1622,10 @@ int may_open(struct nameidata *nd, int acc_mode, int flag)
                 flag &= ~O_TRUNC;
         } else if (IS_RDONLY(inode) && (flag & FMODE_WRITE))
                 return -EROFS;
+
+       error = vfs_permission(nd, acc_mode);
+       if (error)
+               return error;
         /*
          * An append-only file must be opened in append mode for writing.
          */
@@ -1558,7 +1638,7 @@ int may_open(struct nameidata *nd, int acc_mode, int flag)
  
         /* O_NOATIME can only be set by the owner or superuser */
         if (flag & O_NOATIME)
-               if (current->fsuid != inode->i_uid && !capable(CAP_FOWNER))
+               if (!is_owner_or_cap(inode))
                         return -EPERM;
  
         /*
@@ -1579,8 +1659,10 @@ int may_open(struct nameidata *nd, int acc_mode, int flag)
                 error = locks_verify_locked(inode);
                 if (!error) {
                         DQUOT_INIT(inode);
-                       
-                       error = do_truncate(dentry, 0, ATTR_MTIME|ATTR_CTIME, NULL);
+
+                       error = do_truncate(dentry, 0,
+                                           ATTR_MTIME|ATTR_CTIME|ATTR_OPEN,
+                                           NULL);
                 }
                 put_write_access(inode);
                 if (error)
@@ -1701,7 +1783,7 @@ do_last:
          * It already exists.
          */
         mutex_unlock(&dir->d_inode->i_mutex);
-       audit_inode_update(path.dentry->d_inode);
+       audit_inode(pathname, path.dentry);
  
         error = -EEXIST;
         if (flag & O_EXCL)
@@ -2480,7 +2562,7 @@ int vfs_rename(struct inode *old_dir, struct dentry *old_dentry,
         if (!error) {
                 const char *new_name = old_dentry->d_name.name;
                 fsnotify_move(old_dir, new_dir, old_name, new_name, is_dir,
-                             new_dentry->d_inode, old_dentry->d_inode);
+                             new_dentry->d_inode, old_dentry);
         }
         fsnotify_oldname_free(old_name);
  
@@ -2639,19 +2721,9 @@ static char *page_getlink(struct dentry * dentry, struct page **ppage)
         struct address_space *mapping = dentry->d_inode->i_mapping;
         page = read_mapping_page(mapping, 0, NULL);
         if (IS_ERR(page))
-               goto sync_fail;
-       wait_on_page_locked(page);
-       if (!PageUptodate(page))
-               goto async_fail;
+               return (char*)page;
         *ppage = page;
         return kmap(page);
-
-async_fail:
-       page_cache_release(page);
-       return ERR_PTR(-EIO);
-
-sync_fail:
-       return (char*)page;
  }
  
  int page_readlink(struct dentry *dentry, char __user *buffer, int buflen)
@@ -2688,52 +2760,29 @@ int __page_symlink(struct inode *inode, const char *symname, int len,
  {
         struct address_space *mapping = inode->i_mapping;
         struct page *page;
-       int err = -ENOMEM;
+       void *fsdata;
+       int err;
         char *kaddr;
  
  retry:
-       page = find_or_create_page(mapping, 0, gfp_mask);
-       if (!page)
-               goto fail;
-       err = mapping->a_ops->prepare_write(NULL, page, 0, len-1);
-       if (err == AOP_TRUNCATED_PAGE) {
-               page_cache_release(page);
-               goto retry;
-       }
+       err = pagecache_write_begin(NULL, mapping, 0, len-1,
+                               AOP_FLAG_UNINTERRUPTIBLE, &page, &fsdata);
         if (err)
-               goto fail_map;
+               goto fail;
+
         kaddr = kmap_atomic(page, KM_USER0);
         memcpy(kaddr, symname, len-1);
         kunmap_atomic(kaddr, KM_USER0);
-       err = mapping->a_ops->commit_write(NULL, page, 0, len-1);
-       if (err == AOP_TRUNCATED_PAGE) {
-               page_cache_release(page);
-               goto retry;
-       }
-       if (err)
-               goto fail_map;
-       /*
-        * Notice that we are _not_ going to block here - end of page is
-        * unmapped, so this will only try to map the rest of page, see
-        * that it is unmapped (typically even will not look into inode -
-        * ->i_size will be enough for everything) and zero it out.
-        * OTOH it's obviously correct and should make the page up-to-date.
-        */
-       if (!PageUptodate(page)) {
-               err = mapping->a_ops->readpage(NULL, page);
-               if (err != AOP_TRUNCATED_PAGE)
-                       wait_on_page_locked(page);
-       } else {
-               unlock_page(page);
-       }
-       page_cache_release(page);
+
+       err = pagecache_write_end(NULL, mapping, 0, len-1, len-1,
+                                                       page, fsdata);
         if (err < 0)
                 goto fail;
+       if (err < len-1)
+               goto retry;
+
         mark_inode_dirty(inode);
         return 0;
-fail_map:
-       unlock_page(page);
-       page_cache_release(page);
  fail:
         return err;
  }
@@ -2744,7 +2793,7 @@ int page_symlink(struct inode *inode, const char *symname, int len)
                         mapping_gfp_mask(inode->i_mapping));
  }
  
-struct inode_operations page_symlink_inode_operations = {
+const struct inode_operations page_symlink_inode_operations = {
         .readlink       = generic_readlink,
         .follow_link    = page_follow_link_light,
         .put_link       = page_put_link,
@@ -2765,8 +2814,8 @@ EXPORT_SYMBOL(__page_symlink);
  EXPORT_SYMBOL(page_symlink);
  EXPORT_SYMBOL(page_symlink_inode_operations);
  EXPORT_SYMBOL(path_lookup);
+EXPORT_SYMBOL(vfs_path_lookup);
  EXPORT_SYMBOL(path_release);
-EXPORT_SYMBOL(path_walk);
  EXPORT_SYMBOL(permission);
  EXPORT_SYMBOL(vfs_permission);
  EXPORT_SYMBOL(file_permission);