Merge branch 'for-linus' of git://git.kernel.org/pub/scm/linux/kernel/git/mszeredi...
[safe/jmp/linux-2.6] / fs / fuse / dev.c
index c4a3d9b..9424796 100644 (file)
 #include <linux/pagemap.h>
 #include <linux/file.h>
 #include <linux/slab.h>
+#include <linux/pipe_fs_i.h>
+#include <linux/swap.h>
+#include <linux/splice.h>
 
 MODULE_ALIAS_MISCDEV(FUSE_MINOR);
+MODULE_ALIAS("devname:fuse");
 
 static struct kmem_cache *fuse_req_cachep;
 
@@ -46,6 +50,7 @@ struct fuse_req *fuse_request_alloc(void)
                fuse_request_init(req);
        return req;
 }
+EXPORT_SYMBOL_GPL(fuse_request_alloc);
 
 struct fuse_req *fuse_request_alloc_nofs(void)
 {
@@ -124,6 +129,7 @@ struct fuse_req *fuse_get_req(struct fuse_conn *fc)
        atomic_dec(&fc->num_waiting);
        return ERR_PTR(err);
 }
+EXPORT_SYMBOL_GPL(fuse_get_req);
 
 /*
  * Return request in fuse_file->reserved_req.  However that may
@@ -208,6 +214,7 @@ void fuse_put_request(struct fuse_conn *fc, struct fuse_req *req)
                        fuse_request_free(req);
        }
 }
+EXPORT_SYMBOL_GPL(fuse_put_request);
 
 static unsigned len_args(unsigned numargs, struct fuse_arg *args)
 {
@@ -247,7 +254,7 @@ static void queue_request(struct fuse_conn *fc, struct fuse_req *req)
 
 static void flush_bg_queue(struct fuse_conn *fc)
 {
-       while (fc->active_background < FUSE_MAX_BACKGROUND &&
+       while (fc->active_background < fc->max_background &&
               !list_empty(&fc->bg_queue)) {
                struct fuse_req *req;
 
@@ -277,14 +284,14 @@ __releases(&fc->lock)
        list_del(&req->intr_entry);
        req->state = FUSE_REQ_FINISHED;
        if (req->background) {
-               if (fc->num_background == FUSE_MAX_BACKGROUND) {
+               if (fc->num_background == fc->max_background) {
                        fc->blocked = 0;
                        wake_up_all(&fc->blocked_waitq);
                }
-               if (fc->num_background == FUSE_CONGESTION_THRESHOLD &&
-                   fc->connected) {
-                       clear_bdi_congested(&fc->bdi, READ);
-                       clear_bdi_congested(&fc->bdi, WRITE);
+               if (fc->num_background == fc->congestion_threshold &&
+                   fc->connected && fc->bdi_initialized) {
+                       clear_bdi_congested(&fc->bdi, BLK_RW_SYNC);
+                       clear_bdi_congested(&fc->bdi, BLK_RW_ASYNC);
                }
                fc->num_background--;
                fc->active_background--;
@@ -400,17 +407,19 @@ void fuse_request_send(struct fuse_conn *fc, struct fuse_req *req)
        }
        spin_unlock(&fc->lock);
 }
+EXPORT_SYMBOL_GPL(fuse_request_send);
 
 static void fuse_request_send_nowait_locked(struct fuse_conn *fc,
                                            struct fuse_req *req)
 {
        req->background = 1;
        fc->num_background++;
-       if (fc->num_background == FUSE_MAX_BACKGROUND)
+       if (fc->num_background == fc->max_background)
                fc->blocked = 1;
-       if (fc->num_background == FUSE_CONGESTION_THRESHOLD) {
-               set_bdi_congested(&fc->bdi, READ);
-               set_bdi_congested(&fc->bdi, WRITE);
+       if (fc->num_background == fc->congestion_threshold &&
+           fc->bdi_initialized) {
+               set_bdi_congested(&fc->bdi, BLK_RW_SYNC);
+               set_bdi_congested(&fc->bdi, BLK_RW_ASYNC);
        }
        list_add_tail(&req->list, &fc->bg_queue);
        flush_bg_queue(fc);
@@ -439,6 +448,7 @@ void fuse_request_send_background(struct fuse_conn *fc, struct fuse_req *req)
        req->isreply = 1;
        fuse_request_send_nowait(fc, req);
 }
+EXPORT_SYMBOL_GPL(fuse_request_send_background);
 
 /*
  * Called under fc->lock
@@ -492,6 +502,9 @@ struct fuse_copy_state {
        int write;
        struct fuse_req *req;
        const struct iovec *iov;
+       struct pipe_buffer *pipebufs;
+       struct pipe_buffer *currbuf;
+       struct pipe_inode_info *pipe;
        unsigned long nr_segs;
        unsigned long seglen;
        unsigned long addr;
@@ -499,16 +512,16 @@ struct fuse_copy_state {
        void *mapaddr;
        void *buf;
        unsigned len;
+       unsigned move_pages:1;
 };
 
 static void fuse_copy_init(struct fuse_copy_state *cs, struct fuse_conn *fc,
-                          int write, struct fuse_req *req,
+                          int write,
                           const struct iovec *iov, unsigned long nr_segs)
 {
        memset(cs, 0, sizeof(*cs));
        cs->fc = fc;
        cs->write = write;
-       cs->req = req;
        cs->iov = iov;
        cs->nr_segs = nr_segs;
 }
@@ -516,7 +529,18 @@ static void fuse_copy_init(struct fuse_copy_state *cs, struct fuse_conn *fc,
 /* Unmap and put previous page of userspace buffer */
 static void fuse_copy_finish(struct fuse_copy_state *cs)
 {
-       if (cs->mapaddr) {
+       if (cs->currbuf) {
+               struct pipe_buffer *buf = cs->currbuf;
+
+               if (!cs->write) {
+                       buf->ops->unmap(cs->pipe, buf, cs->mapaddr);
+               } else {
+                       kunmap_atomic(cs->mapaddr, KM_USER0);
+                       buf->len = PAGE_SIZE - cs->len;
+               }
+               cs->currbuf = NULL;
+               cs->mapaddr = NULL;
+       } else if (cs->mapaddr) {
                kunmap_atomic(cs->mapaddr, KM_USER0);
                if (cs->write) {
                        flush_dcache_page(cs->pg);
@@ -538,26 +562,61 @@ static int fuse_copy_fill(struct fuse_copy_state *cs)
 
        unlock_request(cs->fc, cs->req);
        fuse_copy_finish(cs);
-       if (!cs->seglen) {
-               BUG_ON(!cs->nr_segs);
-               cs->seglen = cs->iov[0].iov_len;
-               cs->addr = (unsigned long) cs->iov[0].iov_base;
-               cs->iov++;
-               cs->nr_segs--;
+       if (cs->pipebufs) {
+               struct pipe_buffer *buf = cs->pipebufs;
+
+               if (!cs->write) {
+                       err = buf->ops->confirm(cs->pipe, buf);
+                       if (err)
+                               return err;
+
+                       BUG_ON(!cs->nr_segs);
+                       cs->currbuf = buf;
+                       cs->mapaddr = buf->ops->map(cs->pipe, buf, 1);
+                       cs->len = buf->len;
+                       cs->buf = cs->mapaddr + buf->offset;
+                       cs->pipebufs++;
+                       cs->nr_segs--;
+               } else {
+                       struct page *page;
+
+                       if (cs->nr_segs == cs->pipe->buffers)
+                               return -EIO;
+
+                       page = alloc_page(GFP_HIGHUSER);
+                       if (!page)
+                               return -ENOMEM;
+
+                       buf->page = page;
+                       buf->offset = 0;
+                       buf->len = 0;
+
+                       cs->currbuf = buf;
+                       cs->mapaddr = kmap_atomic(page, KM_USER0);
+                       cs->buf = cs->mapaddr;
+                       cs->len = PAGE_SIZE;
+                       cs->pipebufs++;
+                       cs->nr_segs++;
+               }
+       } else {
+               if (!cs->seglen) {
+                       BUG_ON(!cs->nr_segs);
+                       cs->seglen = cs->iov[0].iov_len;
+                       cs->addr = (unsigned long) cs->iov[0].iov_base;
+                       cs->iov++;
+                       cs->nr_segs--;
+               }
+               err = get_user_pages_fast(cs->addr, 1, cs->write, &cs->pg);
+               if (err < 0)
+                       return err;
+               BUG_ON(err != 1);
+               offset = cs->addr % PAGE_SIZE;
+               cs->mapaddr = kmap_atomic(cs->pg, KM_USER0);
+               cs->buf = cs->mapaddr + offset;
+               cs->len = min(PAGE_SIZE - offset, cs->seglen);
+               cs->seglen -= cs->len;
+               cs->addr += cs->len;
        }
-       down_read(&current->mm->mmap_sem);
-       err = get_user_pages(current, current->mm, cs->addr, 1, cs->write, 0,
-                            &cs->pg, NULL);
-       up_read(&current->mm->mmap_sem);
-       if (err < 0)
-               return err;
-       BUG_ON(err != 1);
-       offset = cs->addr % PAGE_SIZE;
-       cs->mapaddr = kmap_atomic(cs->pg, KM_USER0);
-       cs->buf = cs->mapaddr + offset;
-       cs->len = min(PAGE_SIZE - offset, cs->seglen);
-       cs->seglen -= cs->len;
-       cs->addr += cs->len;
 
        return lock_request(cs->fc, cs->req);
 }
@@ -579,23 +638,178 @@ static int fuse_copy_do(struct fuse_copy_state *cs, void **val, unsigned *size)
        return ncpy;
 }
 
+/*
+ * Check whether a page obtained from a pipe buffer looks safe to insert
+ * into the page cache.
+ *
+ * The page is rejected when page_mapcount() is non-zero, when it still has
+ * a ->mapping, when its reference count is not exactly one, or when it
+ * carries any PAGE_FLAGS_CHECK_AT_PREP flag other than the tolerated ones
+ * (locked, referenced, uptodate, lru, active, reclaim).
+ *
+ * Returns 0 if the page passes all checks.  Otherwise prints two warning
+ * lines describing the page and returns 1.
+ */
+static int fuse_check_page(struct page *page)
+{
+       if (page_mapcount(page) ||
+           page->mapping != NULL ||
+           page_count(page) != 1 ||
+           (page->flags & PAGE_FLAGS_CHECK_AT_PREP &
+            ~(1 << PG_locked |
+              1 << PG_referenced |
+              1 << PG_uptodate |
+              1 << PG_lru |
+              1 << PG_active |
+              1 << PG_reclaim))) {
+               printk(KERN_WARNING "fuse: trying to steal weird page\n");
+               printk(KERN_WARNING "  page=%p index=%li flags=%08lx, count=%i, mapcount=%i, mapping=%p\n", page, page->index, page->flags, page_count(page), page_mapcount(page), page->mapping);
+               return 1;
+       }
+       return 0;
+}
+
+/*
+ * Try to satisfy a whole-page copy by moving the page held in the next pipe
+ * buffer into the page cache in place of *pagep, instead of copying data.
+ *
+ * Consumes one pipe buffer (cs->pipebufs is advanced, cs->nr_segs is
+ * decremented) whether or not the move succeeds.
+ *
+ * Returns:
+ *   0    the pipe page replaced the old page; *pagep now points to it and
+ *        cs->len is 0
+ *   1    the page could not be moved; the pipe buffer has been mapped into
+ *        cs->buf and the request re-locked, so the caller should copy
+ *   < 0  error: the ->confirm() error, -EIO if the stolen page is not
+ *        uptodate, -ENOENT if the request was aborted, or the error
+ *        returned by lock_request() on the fallback path
+ */
+static int fuse_try_move_page(struct fuse_copy_state *cs, struct page **pagep)
+{
+       int err;
+       struct page *oldpage = *pagep;
+       struct page *newpage;
+       struct pipe_buffer *buf = cs->pipebufs;
+       struct address_space *mapping;
+       pgoff_t index;
+
+       unlock_request(cs->fc, cs->req);
+       fuse_copy_finish(cs);
+
+       err = buf->ops->confirm(cs->pipe, buf);
+       if (err)
+               return err;
+
+       BUG_ON(!cs->nr_segs);
+       cs->currbuf = buf;
+       cs->len = buf->len;
+       cs->pipebufs++;
+       cs->nr_segs--;
+
+       /* Only a buffer holding a complete page can replace a cache page */
+       if (cs->len != PAGE_SIZE)
+               goto out_fallback;
+
+       if (buf->ops->steal(cs->pipe, buf) != 0)
+               goto out_fallback;
+
+       newpage = buf->page;
+
+       if (WARN_ON(!PageUptodate(newpage))) {
+               /*
+                * Every other exit taken after a successful ->steal()
+                * unlocks newpage; do the same here so the page is not
+                * left locked on this error path.
+                */
+               unlock_page(newpage);
+               return -EIO;
+       }
+
+       ClearPageMappedToDisk(newpage);
+
+       if (fuse_check_page(newpage) != 0)
+               goto out_fallback_unlock;
+
+       mapping = oldpage->mapping;
+       index = oldpage->index;
+
+       /*
+        * This is a new and locked page, it shouldn't be mapped or
+        * have any special flags on it
+        */
+       if (WARN_ON(page_mapped(oldpage)))
+               goto out_fallback_unlock;
+       if (WARN_ON(page_has_private(oldpage)))
+               goto out_fallback_unlock;
+       if (WARN_ON(PageDirty(oldpage) || PageWriteback(oldpage)))
+               goto out_fallback_unlock;
+       if (WARN_ON(PageMlocked(oldpage)))
+               goto out_fallback_unlock;
+
+       remove_from_page_cache(oldpage);
+       page_cache_release(oldpage);
+
+       err = add_to_page_cache_locked(newpage, mapping, index, GFP_KERNEL);
+       if (err) {
+               /*
+                * NOTE(review): oldpage has already been removed from the
+                * page cache and had a reference dropped above, yet the
+                * fallback makes the caller copy into it -- confirm this
+                * is the intended recovery.
+                */
+               printk(KERN_WARNING "fuse_try_move_page: failed to add page\n");
+               goto out_fallback_unlock;
+       }
+       page_cache_get(newpage);
+
+       if (!(buf->flags & PIPE_BUF_FLAG_LRU))
+               lru_cache_add_file(newpage);
+
+       /* Publish the new page only if the request was not aborted meanwhile */
+       err = 0;
+       spin_lock(&cs->fc->lock);
+       if (cs->req->aborted)
+               err = -ENOENT;
+       else
+               *pagep = newpage;
+       spin_unlock(&cs->fc->lock);
+
+       if (err) {
+               unlock_page(newpage);
+               page_cache_release(newpage);
+               return err;
+       }
+
+       unlock_page(oldpage);
+       page_cache_release(oldpage);
+       cs->len = 0;
+
+       return 0;
+
+out_fallback_unlock:
+       unlock_page(newpage);
+out_fallback:
+       /* Could not move the page: map the buffer so the caller can copy */
+       cs->mapaddr = buf->ops->map(cs->pipe, buf, 1);
+       cs->buf = cs->mapaddr + buf->offset;
+
+       err = lock_request(cs->fc, cs->req);
+       if (err)
+               return err;
+
+       return 1;
+}
+
+/*
+ * Pass a request page to the pipe by reference instead of copying it:
+ * take an extra reference on the page and record (page, offset, count) in
+ * the next slot of cs->pipebufs.
+ *
+ * Returns -EIO if cs->nr_segs has already reached cs->pipe->buffers (no
+ * slot left), otherwise 0.  On success the request is unlocked, any buffer
+ * in progress is finished, cs->nr_segs is incremented and cs->len is reset
+ * to 0.
+ */
+static int fuse_ref_page(struct fuse_copy_state *cs, struct page *page,
+                        unsigned offset, unsigned count)
+{
+       struct pipe_buffer *buf;
+
+       if (cs->nr_segs == cs->pipe->buffers)
+               return -EIO;
+
+       unlock_request(cs->fc, cs->req);
+       fuse_copy_finish(cs);
+
+       buf = cs->pipebufs;
+       /* The pipe buffer holds its own reference to the page */
+       page_cache_get(page);
+       buf->page = page;
+       buf->offset = offset;
+       buf->len = count;
+
+       cs->pipebufs++;
+       cs->nr_segs++;
+       cs->len = 0;
+
+       return 0;
+}
+
 /*
  * Copy a page in the request to/from the userspace buffer.  Must be
  * done atomically
  */
-static int fuse_copy_page(struct fuse_copy_state *cs, struct page *page,
+static int fuse_copy_page(struct fuse_copy_state *cs, struct page **pagep,
                          unsigned offset, unsigned count, int zeroing)
 {
+       int err;
+       struct page *page = *pagep;
+
        if (page && zeroing && count < PAGE_SIZE) {
                void *mapaddr = kmap_atomic(page, KM_USER1);
                memset(mapaddr, 0, PAGE_SIZE);
                kunmap_atomic(mapaddr, KM_USER1);
        }
        while (count) {
-               if (!cs->len) {
-                       int err = fuse_copy_fill(cs);
-                       if (err)
-                               return err;
+               if (cs->write && cs->pipebufs && page) {
+                       return fuse_ref_page(cs, page, offset, count);
+               } else if (!cs->len) {
+                       if (cs->move_pages && page &&
+                           offset == 0 && count == PAGE_SIZE) {
+                               err = fuse_try_move_page(cs, pagep);
+                               if (err <= 0)
+                                       return err;
+                       } else {
+                               err = fuse_copy_fill(cs);
+                               if (err)
+                                       return err;
+                       }
                }
                if (page) {
                        void *mapaddr = kmap_atomic(page, KM_USER1);
@@ -620,8 +834,10 @@ static int fuse_copy_pages(struct fuse_copy_state *cs, unsigned nbytes,
        unsigned count = min(nbytes, (unsigned) PAGE_SIZE - offset);
 
        for (i = 0; i < req->num_pages && (nbytes || zeroing); i++) {
-               struct page *page = req->pages[i];
-               int err = fuse_copy_page(cs, page, offset, count, zeroing);
+               int err;
+
+               err = fuse_copy_page(cs, &req->pages[i], offset, count,
+                                    zeroing);
                if (err)
                        return err;
 
@@ -698,11 +914,10 @@ __acquires(&fc->lock)
  *
  * Called with fc->lock held, releases it
  */
-static int fuse_read_interrupt(struct fuse_conn *fc, struct fuse_req *req,
-                              const struct iovec *iov, unsigned long nr_segs)
+static int fuse_read_interrupt(struct fuse_conn *fc, struct fuse_copy_state *cs,
+                              size_t nbytes, struct fuse_req *req)
 __releases(&fc->lock)
 {
-       struct fuse_copy_state cs;
        struct fuse_in_header ih;
        struct fuse_interrupt_in arg;
        unsigned reqsize = sizeof(ih) + sizeof(arg);
@@ -718,14 +933,13 @@ __releases(&fc->lock)
        arg.unique = req->in.h.unique;
 
        spin_unlock(&fc->lock);
-       if (iov_length(iov, nr_segs) < reqsize)
+       if (nbytes < reqsize)
                return -EINVAL;
 
-       fuse_copy_init(&cs, fc, 1, NULL, iov, nr_segs);
-       err = fuse_copy_one(&cs, &ih, sizeof(ih));
+       err = fuse_copy_one(cs, &ih, sizeof(ih));
        if (!err)
-               err = fuse_copy_one(&cs, &arg, sizeof(arg));
-       fuse_copy_finish(&cs);
+               err = fuse_copy_one(cs, &arg, sizeof(arg));
+       fuse_copy_finish(cs);
 
        return err ? err : reqsize;
 }
@@ -739,18 +953,13 @@ __releases(&fc->lock)
  * request_end().  Otherwise add it to the processing list, and set
  * the 'sent' flag.
  */
-static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
-                             unsigned long nr_segs, loff_t pos)
+static ssize_t fuse_dev_do_read(struct fuse_conn *fc, struct file *file,
+                               struct fuse_copy_state *cs, size_t nbytes)
 {
        int err;
        struct fuse_req *req;
        struct fuse_in *in;
-       struct fuse_copy_state cs;
        unsigned reqsize;
-       struct file *file = iocb->ki_filp;
-       struct fuse_conn *fc = fuse_get_conn(file);
-       if (!fc)
-               return -EPERM;
 
  restart:
        spin_lock(&fc->lock);
@@ -770,7 +979,7 @@ static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
        if (!list_empty(&fc->interrupts)) {
                req = list_entry(fc->interrupts.next, struct fuse_req,
                                 intr_entry);
-               return fuse_read_interrupt(fc, req, iov, nr_segs);
+               return fuse_read_interrupt(fc, cs, nbytes, req);
        }
 
        req = list_entry(fc->pending.next, struct fuse_req, list);
@@ -780,7 +989,7 @@ static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
        in = &req->in;
        reqsize = in->h.len;
        /* If request is too large, reply with an error and restart the read */
-       if (iov_length(iov, nr_segs) < reqsize) {
+       if (nbytes < reqsize) {
                req->out.h.error = -EIO;
                /* SETXATTR is special, since it may contain too large data */
                if (in->h.opcode == FUSE_SETXATTR)
@@ -789,12 +998,12 @@ static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
                goto restart;
        }
        spin_unlock(&fc->lock);
-       fuse_copy_init(&cs, fc, 1, req, iov, nr_segs);
-       err = fuse_copy_one(&cs, &in->h, sizeof(in->h));
+       cs->req = req;
+       err = fuse_copy_one(cs, &in->h, sizeof(in->h));
        if (!err)
-               err = fuse_copy_args(&cs, in->numargs, in->argpages,
+               err = fuse_copy_args(cs, in->numargs, in->argpages,
                                     (struct fuse_arg *) in->args, 0);
-       fuse_copy_finish(&cs);
+       fuse_copy_finish(cs);
        spin_lock(&fc->lock);
        req->locked = 0;
        if (req->aborted) {
@@ -822,20 +1031,204 @@ static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
        return err;
 }
 
+/*
+ * aio_read entry point for the fuse device: set up an iovec-backed copy
+ * state (write direction, i.e. kernel -> userspace buffer) and hand it to
+ * fuse_dev_do_read().
+ *
+ * Returns -EPERM if the file has no fuse connection, otherwise whatever
+ * fuse_dev_do_read() returns.
+ */
+static ssize_t fuse_dev_read(struct kiocb *iocb, const struct iovec *iov,
+                             unsigned long nr_segs, loff_t pos)
+{
+       struct fuse_copy_state cs;
+       struct file *file = iocb->ki_filp;
+       struct fuse_conn *fc = fuse_get_conn(file);
+       if (!fc)
+               return -EPERM;
+
+       fuse_copy_init(&cs, fc, 1, iov, nr_segs);
+
+       return fuse_dev_do_read(fc, file, &cs, iov_length(iov, nr_segs));
+}
+
+/*
+ * ->steal() operation for pipe buffers produced by fuse_dev_splice_read().
+ * Unconditionally returns 1; the ->steal() caller in this file treats any
+ * non-zero result as "could not steal" and falls back to copying.
+ */
+static int fuse_dev_pipe_buf_steal(struct pipe_inode_info *pipe,
+                                  struct pipe_buffer *buf)
+{
+       return 1;
+}
+
+/*
+ * Operations attached to every pipe buffer that fuse_dev_splice_read()
+ * places in a pipe.  All hooks are the generic pipe helpers except
+ * ->steal(), which always refuses (see fuse_dev_pipe_buf_steal()).
+ */
+static const struct pipe_buf_operations fuse_dev_pipe_buf_ops = {
+       .can_merge = 0,
+       .map = generic_pipe_buf_map,
+       .unmap = generic_pipe_buf_unmap,
+       .confirm = generic_pipe_buf_confirm,
+       .release = generic_pipe_buf_release,
+       .steal = fuse_dev_pipe_buf_steal,
+       .get = generic_pipe_buf_get,
+};
+
+/*
+ * splice_read entry point for the fuse device.
+ *
+ * Reads one request into a temporary array of pipe buffers via
+ * fuse_dev_do_read() and then, with the pipe locked, moves those buffers
+ * into the pipe.
+ *
+ * Returns the number of bytes placed in the pipe, or a negative error:
+ * -EPERM (no connection), -ENOMEM, the error from fuse_dev_do_read(),
+ * -EPIPE (pipe has no readers; SIGPIPE is also sent) or -EIO (not enough
+ * free slots in the pipe).  Pages of buffers that were not handed to the
+ * pipe are released before returning.
+ */
+static ssize_t fuse_dev_splice_read(struct file *in, loff_t *ppos,
+                                   struct pipe_inode_info *pipe,
+                                   size_t len, unsigned int flags)
+{
+       int ret;
+       int page_nr = 0;
+       int do_wakeup = 0;
+       struct pipe_buffer *bufs;
+       struct fuse_copy_state cs;
+       struct fuse_conn *fc = fuse_get_conn(in);
+       if (!fc)
+               return -EPERM;
+
+       /*
+        * NOTE(review): pipe->buffers is read here without pipe_lock();
+        * confirm the pipe cannot be resized between this allocation and
+        * the locked section below.
+        */
+       bufs = kmalloc(pipe->buffers * sizeof (struct pipe_buffer), GFP_KERNEL);
+       if (!bufs)
+               return -ENOMEM;
+
+       fuse_copy_init(&cs, fc, 1, NULL, 0);
+       cs.pipebufs = bufs;
+       cs.pipe = pipe;
+       ret = fuse_dev_do_read(fc, in, &cs, len);
+       if (ret < 0)
+               goto out;
+
+       /* From here on ret counts the bytes actually placed in the pipe */
+       ret = 0;
+       pipe_lock(pipe);
+
+       if (!pipe->readers) {
+               send_sig(SIGPIPE, current, 0);
+               ret = -EPIPE;
+               goto out_unlock;
+       }
+
+       if (pipe->nrbufs + cs.nr_segs > pipe->buffers) {
+               ret = -EIO;
+               goto out_unlock;
+       }
+
+       while (page_nr < cs.nr_segs) {
+               int newbuf = (pipe->curbuf + pipe->nrbufs) & (pipe->buffers - 1);
+               struct pipe_buffer *buf = pipe->bufs + newbuf;
+
+               buf->page = bufs[page_nr].page;
+               buf->offset = bufs[page_nr].offset;
+               buf->len = bufs[page_nr].len;
+               buf->ops = &fuse_dev_pipe_buf_ops;
+               /* Don't inherit flags left by the slot's previous buffer */
+               buf->flags = 0;
+
+               pipe->nrbufs++;
+               page_nr++;
+               ret += buf->len;
+
+               if (pipe->inode)
+                       do_wakeup = 1;
+       }
+
+out_unlock:
+       pipe_unlock(pipe);
+
+       if (do_wakeup) {
+               smp_mb();
+               if (waitqueue_active(&pipe->wait))
+                       wake_up_interruptible(&pipe->wait);
+               kill_fasync(&pipe->fasync_readers, SIGIO, POLL_IN);
+       }
+
+out:
+       /* Drop the pages of any buffers that never made it into the pipe */
+       for (; page_nr < cs.nr_segs; page_nr++)
+               page_cache_release(bufs[page_nr].page);
+
+       kfree(bufs);
+       return ret;
+}
+
 static int fuse_notify_poll(struct fuse_conn *fc, unsigned int size,
                            struct fuse_copy_state *cs)
 {
        struct fuse_notify_poll_wakeup_out outarg;
-       int err;
+       int err = -EINVAL;
 
        if (size != sizeof(outarg))
-               return -EINVAL;
+               goto err;
 
        err = fuse_copy_one(cs, &outarg, sizeof(outarg));
        if (err)
-               return err;
+               goto err;
 
+       fuse_copy_finish(cs);
        return fuse_notify_poll_wakeup(fc, &outarg);
+
+err:
+       fuse_copy_finish(cs);
+       return err;
+}
+
+/*
+ * Handle a FUSE_NOTIFY_INVAL_INODE notification written to the device.
+ *
+ * @size must equal sizeof(struct fuse_notify_inval_inode_out); the payload
+ * is copied in and, if the connection still has a superblock, passed to
+ * fuse_reverse_inval_inode() under fc->killsb held for reading.
+ *
+ * Returns -EINVAL on a size mismatch, the fuse_copy_one() error, -ENOENT
+ * if fc->sb is not set, or the result of fuse_reverse_inval_inode().
+ * fuse_copy_finish() is called on every path.
+ */
+static int fuse_notify_inval_inode(struct fuse_conn *fc, unsigned int size,
+                                  struct fuse_copy_state *cs)
+{
+       struct fuse_notify_inval_inode_out outarg;
+       int err = -EINVAL;
+
+       if (size != sizeof(outarg))
+               goto err;
+
+       err = fuse_copy_one(cs, &outarg, sizeof(outarg));
+       if (err)
+               goto err;
+       fuse_copy_finish(cs);
+
+       down_read(&fc->killsb);
+       err = -ENOENT;
+       if (fc->sb) {
+               err = fuse_reverse_inval_inode(fc->sb, outarg.ino,
+                                              outarg.off, outarg.len);
+       }
+       up_read(&fc->killsb);
+       return err;
+
+err:
+       fuse_copy_finish(cs);
+       return err;
+}
+
+/*
+ * Handle a FUSE_NOTIFY_INVAL_ENTRY notification written to the device.
+ *
+ * The payload is a struct fuse_notify_inval_entry_out followed by the
+ * entry name, outarg.namelen bytes plus one terminating byte.  @size is
+ * the number of payload bytes the writer supplied and must match that
+ * layout exactly.
+ *
+ * Returns -ENOMEM, -EINVAL (payload too short or inconsistent with
+ * namelen), -ENAMETOOLONG (namelen > FUSE_NAME_MAX), the fuse_copy_one()
+ * error, -ENOENT if fc->sb is not set, or the result of
+ * fuse_reverse_inval_entry().  fuse_copy_finish() is called on every path.
+ */
+static int fuse_notify_inval_entry(struct fuse_conn *fc, unsigned int size,
+                                  struct fuse_copy_state *cs)
+{
+       struct fuse_notify_inval_entry_out outarg;
+       int err = -ENOMEM;
+       char *buf;
+       struct qstr name;
+
+       buf = kzalloc(FUSE_NAME_MAX + 1, GFP_KERNEL);
+       if (!buf)
+               goto err;
+
+       err = -EINVAL;
+       if (size < sizeof(outarg))
+               goto err;
+
+       err = fuse_copy_one(cs, &outarg, sizeof(outarg));
+       if (err)
+               goto err;
+
+       err = -ENAMETOOLONG;
+       if (outarg.namelen > FUSE_NAME_MAX)
+               goto err;
+
+       /*
+        * namelen comes from userspace.  Without this check a short write
+        * with a large namelen makes the copy below run past the supplied
+        * data and hit BUG_ON(!cs->nr_segs) in fuse_copy_fill().
+        */
+       err = -EINVAL;
+       if (size != sizeof(outarg) + outarg.namelen + 1)
+               goto err;
+
+       name.name = buf;
+       name.len = outarg.namelen;
+       err = fuse_copy_one(cs, buf, outarg.namelen + 1);
+       if (err)
+               goto err;
+       fuse_copy_finish(cs);
+       /* Force termination regardless of what the writer supplied */
+       buf[outarg.namelen] = 0;
+       name.hash = full_name_hash(name.name, name.len);
+
+       down_read(&fc->killsb);
+       err = -ENOENT;
+       if (fc->sb)
+               err = fuse_reverse_inval_entry(fc->sb, outarg.parent, &name);
+       up_read(&fc->killsb);
+       kfree(buf);
+       return err;
+
+err:
+       kfree(buf);
+       fuse_copy_finish(cs);
+       return err;
+}
 
 static int fuse_notify(struct fuse_conn *fc, enum fuse_notify_code code,
@@ -845,7 +1238,14 @@ static int fuse_notify(struct fuse_conn *fc, enum fuse_notify_code code,
        case FUSE_NOTIFY_POLL:
                return fuse_notify_poll(fc, size, cs);
 
+       case FUSE_NOTIFY_INVAL_INODE:
+               return fuse_notify_inval_inode(fc, size, cs);
+
+       case FUSE_NOTIFY_INVAL_ENTRY:
+               return fuse_notify_inval_entry(fc, size, cs);
+
        default:
+               fuse_copy_finish(cs);
                return -EINVAL;
        }
 }
@@ -894,23 +1294,17 @@ static int copy_out_args(struct fuse_copy_state *cs, struct fuse_out *out,
  * it from the list and copy the rest of the buffer to the request.
  * The request is finished by calling request_end()
  */
-static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
-                              unsigned long nr_segs, loff_t pos)
+static ssize_t fuse_dev_do_write(struct fuse_conn *fc,
+                                struct fuse_copy_state *cs, size_t nbytes)
 {
        int err;
-       unsigned nbytes = iov_length(iov, nr_segs);
        struct fuse_req *req;
        struct fuse_out_header oh;
-       struct fuse_copy_state cs;
-       struct fuse_conn *fc = fuse_get_conn(iocb->ki_filp);
-       if (!fc)
-               return -EPERM;
 
-       fuse_copy_init(&cs, fc, 0, NULL, iov, nr_segs);
        if (nbytes < sizeof(struct fuse_out_header))
                return -EINVAL;
 
-       err = fuse_copy_one(&cs, &oh, sizeof(oh));
+       err = fuse_copy_one(cs, &oh, sizeof(oh));
        if (err)
                goto err_finish;
 
@@ -923,8 +1317,7 @@ static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
         * and error contains notification code.
         */
        if (!oh.unique) {
-               err = fuse_notify(fc, oh.error, nbytes - sizeof(oh), &cs);
-               fuse_copy_finish(&cs);
+               err = fuse_notify(fc, oh.error, nbytes - sizeof(oh), cs);
                return err ? err : nbytes;
        }
 
@@ -943,7 +1336,7 @@ static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
 
        if (req->aborted) {
                spin_unlock(&fc->lock);
-               fuse_copy_finish(&cs);
+               fuse_copy_finish(cs);
                spin_lock(&fc->lock);
                request_end(fc, req);
                return -ENOENT;
@@ -960,7 +1353,7 @@ static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
                        queue_interrupt(fc, req);
 
                spin_unlock(&fc->lock);
-               fuse_copy_finish(&cs);
+               fuse_copy_finish(cs);
                return nbytes;
        }
 
@@ -968,11 +1361,13 @@ static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
        list_move(&req->list, &fc->io);
        req->out.h = oh;
        req->locked = 1;
-       cs.req = req;
+       cs->req = req;
+       if (!req->out.page_replace)
+               cs->move_pages = 0;
        spin_unlock(&fc->lock);
 
-       err = copy_out_args(&cs, &req->out, nbytes);
-       fuse_copy_finish(&cs);
+       err = copy_out_args(cs, &req->out, nbytes);
+       fuse_copy_finish(cs);
 
        spin_lock(&fc->lock);
        req->locked = 0;
@@ -988,10 +1383,101 @@ static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
  err_unlock:
        spin_unlock(&fc->lock);
  err_finish:
-       fuse_copy_finish(&cs);
+       fuse_copy_finish(cs);
        return err;
 }
 
+/*
+ * aio_write entry point for the fuse device: set up an iovec-backed copy
+ * state (read direction, i.e. userspace buffer -> kernel) and hand it to
+ * fuse_dev_do_write().
+ *
+ * Returns -EPERM if the file has no fuse connection, otherwise whatever
+ * fuse_dev_do_write() returns.
+ */
+static ssize_t fuse_dev_write(struct kiocb *iocb, const struct iovec *iov,
+                             unsigned long nr_segs, loff_t pos)
+{
+       struct fuse_copy_state cs;
+       struct fuse_conn *fc = fuse_get_conn(iocb->ki_filp);
+       if (!fc)
+               return -EPERM;
+
+       fuse_copy_init(&cs, fc, 0, iov, nr_segs);
+
+       return fuse_dev_do_write(fc, &cs, iov_length(iov, nr_segs));
+}
+
+/*
+ * splice_write entry point for the fuse device.
+ *
+ * With the pipe locked, gathers exactly @len bytes of pipe buffers into a
+ * private array: buffers that are consumed entirely are moved out of the
+ * pipe, while a final partially consumed buffer is shared through ->get()
+ * and the remainder stays in the pipe.  The array is then processed by
+ * fuse_dev_do_write() and every gathered buffer is released.
+ *
+ * If SPLICE_F_MOVE is set in @flags, page moving is enabled in the copy
+ * state (cs.move_pages).
+ *
+ * Returns the result of fuse_dev_do_write(), or -EPERM (no connection),
+ * -ENOMEM, or -EINVAL if the pipe holds fewer than @len bytes.
+ */
+static ssize_t fuse_dev_splice_write(struct pipe_inode_info *pipe,
+                                    struct file *out, loff_t *ppos,
+                                    size_t len, unsigned int flags)
+{
+       unsigned nbuf;
+       unsigned idx;
+       struct pipe_buffer *bufs;
+       struct fuse_copy_state cs;
+       struct fuse_conn *fc;
+       size_t rem;
+       ssize_t ret;
+
+       fc = fuse_get_conn(out);
+       if (!fc)
+               return -EPERM;
+
+       pipe_lock(pipe);
+
+       /*
+        * Size the array only after taking pipe_lock(): pipe->buffers is
+        * used below to bound the fill loop, so both reads must see the
+        * same value.
+        */
+       bufs = kmalloc(pipe->buffers * sizeof (struct pipe_buffer), GFP_KERNEL);
+       if (!bufs) {
+               pipe_unlock(pipe);
+               return -ENOMEM;
+       }
+
+       /* First pass: make sure the pipe really holds len bytes */
+       nbuf = 0;
+       rem = 0;
+       for (idx = 0; idx < pipe->nrbufs && rem < len; idx++)
+               rem += pipe->bufs[(pipe->curbuf + idx) & (pipe->buffers - 1)].len;
+
+       ret = -EINVAL;
+       if (rem < len) {
+               pipe_unlock(pipe);
+               goto out;
+       }
+
+       /* Second pass: take len bytes worth of buffers out of the pipe */
+       rem = len;
+       while (rem) {
+               struct pipe_buffer *ibuf;
+               struct pipe_buffer *obuf;
+
+               BUG_ON(nbuf >= pipe->buffers);
+               BUG_ON(!pipe->nrbufs);
+               ibuf = &pipe->bufs[pipe->curbuf];
+               obuf = &bufs[nbuf];
+
+               if (rem >= ibuf->len) {
+                       /* Whole buffer consumed: move it out of the pipe */
+                       *obuf = *ibuf;
+                       ibuf->ops = NULL;
+                       pipe->curbuf = (pipe->curbuf + 1) & (pipe->buffers - 1);
+                       pipe->nrbufs--;
+               } else {
+                       /* Partial buffer: share the page, split the range */
+                       ibuf->ops->get(pipe, ibuf);
+                       *obuf = *ibuf;
+                       obuf->flags &= ~PIPE_BUF_FLAG_GIFT;
+                       obuf->len = rem;
+                       ibuf->offset += obuf->len;
+                       ibuf->len -= obuf->len;
+               }
+               nbuf++;
+               rem -= obuf->len;
+       }
+       pipe_unlock(pipe);
+
+       fuse_copy_init(&cs, fc, 0, NULL, nbuf);
+       cs.pipebufs = bufs;
+       cs.pipe = pipe;
+
+       if (flags & SPLICE_F_MOVE)
+               cs.move_pages = 1;
+
+       ret = fuse_dev_do_write(fc, &cs, len);
+
+       for (idx = 0; idx < nbuf; idx++) {
+               struct pipe_buffer *buf = &bufs[idx];
+               buf->ops->release(pipe, buf);
+       }
+out:
+       kfree(bufs);
+       return ret;
+}
+
 static unsigned fuse_dev_poll(struct file *file, poll_table *wait)
 {
        unsigned mask = POLLOUT | POLLWRNORM;
@@ -1100,8 +1586,9 @@ void fuse_abort_conn(struct fuse_conn *fc)
        }
        spin_unlock(&fc->lock);
 }
+EXPORT_SYMBOL_GPL(fuse_abort_conn);
 
-static int fuse_dev_release(struct inode *inode, struct file *file)
+int fuse_dev_release(struct inode *inode, struct file *file)
 {
        struct fuse_conn *fc = fuse_get_conn(file);
        if (fc) {
@@ -1115,6 +1602,7 @@ static int fuse_dev_release(struct inode *inode, struct file *file)
 
        return 0;
 }
+EXPORT_SYMBOL_GPL(fuse_dev_release);
 
 static int fuse_dev_fasync(int fd, struct file *file, int on)
 {
@@ -1131,12 +1619,15 @@ const struct file_operations fuse_dev_operations = {
        .llseek         = no_llseek,
        .read           = do_sync_read,
        .aio_read       = fuse_dev_read,
+       .splice_read    = fuse_dev_splice_read,
        .write          = do_sync_write,
        .aio_write      = fuse_dev_write,
+       .splice_write   = fuse_dev_splice_write,
        .poll           = fuse_dev_poll,
        .release        = fuse_dev_release,
        .fasync         = fuse_dev_fasync,
 };
+EXPORT_SYMBOL_GPL(fuse_dev_operations);
 
 static struct miscdevice fuse_miscdevice = {
        .minor = FUSE_MINOR,