ASoC: rockchip: spdif: drop owner assignment from platform_drivers

[firefly-linux-kernel-4.4.55.git] / mm / filemap.c
diff --git a/mm/filemap.c b/mm/filemap.c

index a8251a8d3457d28802164d6538c9226e98416f73..7905fe721aa8ab3db06c957c9f2cc63cea1fee5f 100644 (file)
--- a/mm/filemap.c
+++ b/mm/filemap.c
@@ -9,7 +9,7 @@
   * most "normal" filesystems (but you don't /have/ to use this:
   * the NFS filesystem used to do this differently, for example)
   */
-#include <linux/module.h>
+#include <linux/export.h>
  #include <linux/compiler.h>
  #include <linux/fs.h>
  #include <linux/uaccess.h>
@@ -29,14 +29,15 @@
  #include <linux/pagevec.h>
  #include <linux/blkdev.h>
  #include <linux/security.h>
-#include <linux/syscalls.h>
  #include <linux/cpuset.h>
  #include <linux/hardirq.h> /* for BUG_ON(!in_atomic()) only */
  #include <linux/memcontrol.h>
-#include <linux/mm_inline.h> /* for page_is_file_cache() */
  #include <linux/cleancache.h>
  #include "internal.h"
  
+#define CREATE_TRACE_POINTS
+#include <trace/events/filemap.h>
+
  /*
   * FIXME: remove all knowledge of the buffer layer from the core VM
   */
@@ -78,10 +79,7 @@
   *  ->i_mutex                  (generic_file_buffered_write)
   *    ->mmap_sem               (fault_in_pages_readable->do_page_fault)
   *
- *  ->i_mutex
- *    ->i_alloc_sem             (various)
- *
- *  inode_wb_list_lock
+ *  bdi->wb.list_lock
   *    sb_lock                  (fs/fs-writeback.c)
   *    ->mapping->tree_lock     (__sync_single_inode)
   *
@@ -99,15 +97,14 @@
   *    ->zone.lru_lock          (check_pte_range->isolate_lru_page)
   *    ->private_lock           (page_remove_rmap->set_page_dirty)
   *    ->tree_lock              (page_remove_rmap->set_page_dirty)
- *    inode_wb_list_lock       (page_remove_rmap->set_page_dirty)
+ *    bdi.wb->list_lock                (page_remove_rmap->set_page_dirty)
   *    ->inode->i_lock          (page_remove_rmap->set_page_dirty)
- *    inode_wb_list_lock       (zap_pte_range->set_page_dirty)
+ *    bdi.wb->list_lock                (zap_pte_range->set_page_dirty)
   *    ->inode->i_lock          (zap_pte_range->set_page_dirty)
   *    ->private_lock           (zap_pte_range->__set_page_dirty_buffers)
   *
- *  (code doesn't rely on that order, so you could switch it around)
- *  ->tasklist_lock             (memory_failure, collect_procs_ao)
- *    ->i_mmap_mutex
+ * ->i_mmap_mutex
+ *   ->tasklist_lock            (memory_failure, collect_procs_ao)
   */
  
  /*
@@ -119,6 +116,7 @@ void __delete_from_page_cache(struct page *page)
  {
         struct address_space *mapping = page->mapping;
  
+       trace_mm_filemap_delete_from_page_cache(page);
         /*
          * if we're uptodate, flush out into the cleancache, otherwise
          * invalidate any existing cleancache entries.  We can't leave
@@ -127,10 +125,11 @@ void __delete_from_page_cache(struct page *page)
         if (PageUptodate(page) && PageMappedToDisk(page))
                 cleancache_put_page(page);
         else
-               cleancache_flush_page(mapping, page);
+               cleancache_invalidate_page(mapping, page);
  
         radix_tree_delete(&mapping->page_tree, page->index);
         page->mapping = NULL;
+       /* Leave page->index set: truncation lookup relies upon it */
         mapping->nrpages--;
         __dec_zone_page_state(page, NR_FILE_PAGES);
         if (PageSwapBacked(page))
@@ -189,6 +188,17 @@ static int sleep_on_page_killable(void *word)
         return fatal_signal_pending(current) ? -EINTR : 0;
  }
  
+static int filemap_check_errors(struct address_space *mapping)
+{
+       int ret = 0;
+       /* Check for outstanding write errors */
+       if (test_and_clear_bit(AS_ENOSPC, &mapping->flags))
+               ret = -ENOSPC;
+       if (test_and_clear_bit(AS_EIO, &mapping->flags))
+               ret = -EIO;
+       return ret;
+}
+
  /**
   * __filemap_fdatawrite_range - start writeback on mapping dirty pages in range
   * @mapping:   address space structure to write
@@ -270,10 +280,10 @@ int filemap_fdatawait_range(struct address_space *mapping, loff_t start_byte,
         pgoff_t end = end_byte >> PAGE_CACHE_SHIFT;
         struct pagevec pvec;
         int nr_pages;
-       int ret = 0;
+       int ret2, ret = 0;
  
         if (end_byte < start_byte)
-               return 0;
+               goto out;
  
         pagevec_init(&pvec, 0);
         while ((index <= end) &&
@@ -296,12 +306,10 @@ int filemap_fdatawait_range(struct address_space *mapping, loff_t start_byte,
                 pagevec_release(&pvec);
                 cond_resched();
         }
-
-       /* Check for outstanding write errors */
-       if (test_and_clear_bit(AS_ENOSPC, &mapping->flags))
-               ret = -ENOSPC;
-       if (test_and_clear_bit(AS_EIO, &mapping->flags))
-               ret = -EIO;
+out:
+       ret2 = filemap_check_errors(mapping);
+       if (!ret)
+               ret = ret2;
  
         return ret;
  }
@@ -342,6 +350,8 @@ int filemap_write_and_wait(struct address_space *mapping)
                         if (!err)
                                 err = err2;
                 }
+       } else {
+               err = filemap_check_errors(mapping);
         }
         return err;
  }
@@ -373,6 +383,8 @@ int filemap_write_and_wait_range(struct address_space *mapping,
                         if (!err)
                                 err = err2;
                 }
+       } else {
+               err = filemap_check_errors(mapping);
         }
         return err;
  }
@@ -396,24 +408,11 @@ EXPORT_SYMBOL(filemap_write_and_wait_range);
  int replace_page_cache_page(struct page *old, struct page *new, gfp_t gfp_mask)
  {
         int error;
-       struct mem_cgroup *memcg = NULL;
  
         VM_BUG_ON(!PageLocked(old));
         VM_BUG_ON(!PageLocked(new));
         VM_BUG_ON(new->mapping);
  
-       /*
-        * This is not page migration, but prepare_migration and
-        * end_migration does enough work for charge replacement.
-        *
-        * In the longer term we probably want a specialized function
-        * for moving the charge from old to new in a more efficient
-        * manner.
-        */
-       error = mem_cgroup_prepare_migration(old, new, &memcg, gfp_mask);
-       if (error)
-               return error;
-
         error = radix_tree_preload(gfp_mask & ~__GFP_HIGHMEM);
         if (!error) {
                 struct address_space *mapping = old->mapping;
@@ -435,13 +434,12 @@ int replace_page_cache_page(struct page *old, struct page *new, gfp_t gfp_mask)
                 if (PageSwapBacked(new))
                         __inc_zone_page_state(new, NR_SHMEM);
                 spin_unlock_irq(&mapping->tree_lock);
+               /* mem_cgroup codes must not be called under tree_lock */
+               mem_cgroup_replace_page_cache(old, new);
                 radix_tree_preload_end();
                 if (freepage)
                         freepage(old);
                 page_cache_release(old);
-               mem_cgroup_end_migration(memcg, old, new, true);
-       } else {
-               mem_cgroup_end_migration(memcg, old, new, false);
         }
  
         return error;
@@ -464,6 +462,7 @@ int add_to_page_cache_locked(struct page *page, struct address_space *mapping,
         int error;
  
         VM_BUG_ON(!PageLocked(page));
+       VM_BUG_ON(PageSwapBacked(page));
  
         error = mem_cgroup_cache_charge(page, current->mm,
                                         gfp_mask & GFP_RECLAIM_MASK);
@@ -481,11 +480,11 @@ int add_to_page_cache_locked(struct page *page, struct address_space *mapping,
                 if (likely(!error)) {
                         mapping->nrpages++;
                         __inc_zone_page_state(page, NR_FILE_PAGES);
-                       if (PageSwapBacked(page))
-                               __inc_zone_page_state(page, NR_SHMEM);
                         spin_unlock_irq(&mapping->tree_lock);
+                       trace_mm_filemap_add_to_page_cache(page);
                 } else {
                         page->mapping = NULL;
+                       /* Leave page->index set: truncation relies upon it */
                         spin_unlock_irq(&mapping->tree_lock);
                         mem_cgroup_uncharge_cache_page(page);
                         page_cache_release(page);
@@ -503,22 +502,9 @@ int add_to_page_cache_lru(struct page *page, struct address_space *mapping,
  {
         int ret;
  
-       /*
-        * Splice_read and readahead add shmem/tmpfs pages into the page cache
-        * before shmem_readpage has a chance to mark them as SwapBacked: they
-        * need to go on the anon lru below, and mem_cgroup_cache_charge
-        * (called in add_to_page_cache) needs to know where they're going too.
-        */
-       if (mapping_cap_swap_backed(mapping))
-               SetPageSwapBacked(page);
-
         ret = add_to_page_cache(page, mapping, offset, gfp_mask);
-       if (ret == 0) {
-               if (page_is_file_cache(page))
-                       lru_cache_add_file(page);
-               else
-                       lru_cache_add_anon(page);
-       }
+       if (ret == 0)
+               lru_cache_add_file(page);
         return ret;
  }
  EXPORT_SYMBOL_GPL(add_to_page_cache_lru);
@@ -530,10 +516,13 @@ struct page *__page_cache_alloc(gfp_t gfp)
         struct page *page;
  
         if (cpuset_do_page_mem_spread()) {
-               get_mems_allowed();
-               n = cpuset_mem_spread_node();
-               page = alloc_pages_exact_node(n, gfp, 0);
-               put_mems_allowed();
+               unsigned int cpuset_mems_cookie;
+               do {
+                       cpuset_mems_cookie = get_mems_allowed();
+                       n = cpuset_mem_spread_node();
+                       page = alloc_pages_exact_node(n, gfp, 0);
+               } while (!put_mems_allowed(cpuset_mems_cookie) && !page);
+
                 return page;
         }
         return alloc_pages(gfp, 0);
@@ -715,9 +704,16 @@ repeat:
                 page = radix_tree_deref_slot(pagep);
                 if (unlikely(!page))
                         goto out;
-               if (radix_tree_deref_retry(page))
-                       goto repeat;
-
+               if (radix_tree_exception(page)) {
+                       if (radix_tree_deref_retry(page))
+                               goto repeat;
+                       /*
+                        * Otherwise, shmem/tmpfs must be storing a swap entry
+                        * here as an exceptional entry: so return it without
+                        * attempting to raise page count.
+                        */
+                       goto out;
+               }
                 if (!page_cache_get_speculative(page))
                         goto repeat;
  
@@ -754,7 +750,7 @@ struct page *find_lock_page(struct address_space *mapping, pgoff_t offset)
  
  repeat:
         page = find_get_page(mapping, offset);
-       if (page) {
+       if (page && !radix_tree_exception(page)) {
                 lock_page(page);
                 /* Has the page been truncated? */
                 if (unlikely(page->mapping != mapping)) {
@@ -834,50 +830,54 @@ EXPORT_SYMBOL(find_or_create_page);
  unsigned find_get_pages(struct address_space *mapping, pgoff_t start,
                             unsigned int nr_pages, struct page **pages)
  {
-       unsigned int i;
-       unsigned int ret;
-       unsigned int nr_found;
+       struct radix_tree_iter iter;
+       void **slot;
+       unsigned ret = 0;
+
+       if (unlikely(!nr_pages))
+               return 0;
  
         rcu_read_lock();
  restart:
-       nr_found = radix_tree_gang_lookup_slot(&mapping->page_tree,
-                               (void ***)pages, start, nr_pages);
-       ret = 0;
-       for (i = 0; i < nr_found; i++) {
+       radix_tree_for_each_slot(slot, &mapping->page_tree, &iter, start) {
                 struct page *page;
  repeat:
-               page = radix_tree_deref_slot((void **)pages[i]);
+               page = radix_tree_deref_slot(slot);
                 if (unlikely(!page))
                         continue;
  
-               /*
-                * This can only trigger when the entry at index 0 moves out
-                * of or back to the root: none yet gotten, safe to restart.
-                */
-               if (radix_tree_deref_retry(page)) {
-                       WARN_ON(start | i);
-                       goto restart;
+               if (radix_tree_exception(page)) {
+                       if (radix_tree_deref_retry(page)) {
+                               /*
+                                * Transient condition which can only trigger
+                                * when entry at index 0 moves out of or back
+                                * to root: none yet gotten, safe to restart.
+                                */
+                               WARN_ON(iter.index);
+                               goto restart;
+                       }
+                       /*
+                        * Otherwise, shmem/tmpfs must be storing a swap entry
+                        * here as an exceptional entry: so skip over it -
+                        * we only reach this from invalidate_mapping_pages().
+                        */
+                       continue;
                 }
  
                 if (!page_cache_get_speculative(page))
                         goto repeat;
  
                 /* Has the page moved? */
-               if (unlikely(page != *((void **)pages[i]))) {
+               if (unlikely(page != *slot)) {
                         page_cache_release(page);
                         goto repeat;
                 }
  
                 pages[ret] = page;
-               ret++;
+               if (++ret == nr_pages)
+                       break;
         }
  
-       /*
-        * If all entries were removed before we could secure them,
-        * try again, because callers stop trying once 0 is returned.
-        */
-       if (unlikely(!ret && nr_found))
-               goto restart;
         rcu_read_unlock();
         return ret;
  }
@@ -897,34 +897,45 @@ repeat:
  unsigned find_get_pages_contig(struct address_space *mapping, pgoff_t index,
                                unsigned int nr_pages, struct page **pages)
  {
-       unsigned int i;
-       unsigned int ret;
-       unsigned int nr_found;
+       struct radix_tree_iter iter;
+       void **slot;
+       unsigned int ret = 0;
+
+       if (unlikely(!nr_pages))
+               return 0;
  
         rcu_read_lock();
  restart:
-       nr_found = radix_tree_gang_lookup_slot(&mapping->page_tree,
-                               (void ***)pages, index, nr_pages);
-       ret = 0;
-       for (i = 0; i < nr_found; i++) {
+       radix_tree_for_each_contig(slot, &mapping->page_tree, &iter, index) {
                 struct page *page;
  repeat:
-               page = radix_tree_deref_slot((void **)pages[i]);
+               page = radix_tree_deref_slot(slot);
+               /* The hole, there no reason to continue */
                 if (unlikely(!page))
-                       continue;
+                       break;
  
-               /*
-                * This can only trigger when the entry at index 0 moves out
-                * of or back to the root: none yet gotten, safe to restart.
-                */
-               if (radix_tree_deref_retry(page))
-                       goto restart;
+               if (radix_tree_exception(page)) {
+                       if (radix_tree_deref_retry(page)) {
+                               /*
+                                * Transient condition which can only trigger
+                                * when entry at index 0 moves out of or back
+                                * to root: none yet gotten, safe to restart.
+                                */
+                               goto restart;
+                       }
+                       /*
+                        * Otherwise, shmem/tmpfs must be storing a swap entry
+                        * here as an exceptional entry: so stop looking for
+                        * contiguous pages.
+                        */
+                       break;
+               }
  
                 if (!page_cache_get_speculative(page))
                         goto repeat;
  
                 /* Has the page moved? */
-               if (unlikely(page != *((void **)pages[i]))) {
+               if (unlikely(page != *slot)) {
                         page_cache_release(page);
                         goto repeat;
                 }
@@ -934,14 +945,14 @@ repeat:
                  * otherwise we can get both false positives and false
                  * negatives, which is just confusing to the caller.
                  */
-               if (page->mapping == NULL || page->index != index) {
+               if (page->mapping == NULL || page->index != iter.index) {
                         page_cache_release(page);
                         break;
                 }
  
                 pages[ret] = page;
-               ret++;
-               index++;
+               if (++ret == nr_pages)
+                       break;
         }
         rcu_read_unlock();
         return ret;
@@ -962,48 +973,53 @@ EXPORT_SYMBOL(find_get_pages_contig);
  unsigned find_get_pages_tag(struct address_space *mapping, pgoff_t *index,
                         int tag, unsigned int nr_pages, struct page **pages)
  {
-       unsigned int i;
-       unsigned int ret;
-       unsigned int nr_found;
+       struct radix_tree_iter iter;
+       void **slot;
+       unsigned ret = 0;
+
+       if (unlikely(!nr_pages))
+               return 0;
  
         rcu_read_lock();
  restart:
-       nr_found = radix_tree_gang_lookup_tag_slot(&mapping->page_tree,
-                               (void ***)pages, *index, nr_pages, tag);
-       ret = 0;
-       for (i = 0; i < nr_found; i++) {
+       radix_tree_for_each_tagged(slot, &mapping->page_tree,
+                                  &iter, *index, tag) {
                 struct page *page;
  repeat:
-               page = radix_tree_deref_slot((void **)pages[i]);
+               page = radix_tree_deref_slot(slot);
                 if (unlikely(!page))
                         continue;
  
-               /*
-                * This can only trigger when the entry at index 0 moves out
-                * of or back to the root: none yet gotten, safe to restart.
-                */
-               if (radix_tree_deref_retry(page))
-                       goto restart;
+               if (radix_tree_exception(page)) {
+                       if (radix_tree_deref_retry(page)) {
+                               /*
+                                * Transient condition which can only trigger
+                                * when entry at index 0 moves out of or back
+                                * to root: none yet gotten, safe to restart.
+                                */
+                               goto restart;
+                       }
+                       /*
+                        * This function is never used on a shmem/tmpfs
+                        * mapping, so a swap entry won't be found here.
+                        */
+                       BUG();
+               }
  
                 if (!page_cache_get_speculative(page))
                         goto repeat;
  
                 /* Has the page moved? */
-               if (unlikely(page != *((void **)pages[i]))) {
+               if (unlikely(page != *slot)) {
                         page_cache_release(page);
                         goto repeat;
                 }
  
                 pages[ret] = page;
-               ret++;
+               if (++ret == nr_pages)
+                       break;
         }
  
-       /*
-        * If all entries were removed before we could secure them,
-        * try again, because callers stop trying once 0 is returned.
-        */
-       if (unlikely(!ret && nr_found))
-               goto restart;
         rcu_read_unlock();
  
         if (ret)
@@ -1311,10 +1327,10 @@ int file_read_actor(read_descriptor_t *desc, struct page *page,
          * taking the kmap.
          */
         if (!fault_in_pages_writeable(desc->arg.buf, size)) {
-               kaddr = kmap_atomic(page, KM_USER0);
+               kaddr = kmap_atomic(page);
                 left = __copy_to_user_inatomic(desc->arg.buf,
                                                 kaddr + offset, size);
-               kunmap_atomic(kaddr, KM_USER0);
+               kunmap_atomic(kaddr);
                 if (left == 0)
                         goto success;
         }
@@ -1393,15 +1409,12 @@ generic_file_aio_read(struct kiocb *iocb, const struct iovec *iov,
         unsigned long seg = 0;
         size_t count;
         loff_t *ppos = &iocb->ki_pos;
-       struct blk_plug plug;
  
         count = 0;
         retval = generic_segment_checks(iov, &nr_segs, &count, VERIFY_WRITE);
         if (retval)
                 return retval;
  
-       blk_start_plug(&plug);
-
         /* coalesce the iovecs and go direct-to-BIO for O_DIRECT */
         if (filp->f_flags & O_DIRECT) {
                 loff_t size;
@@ -1474,49 +1487,10 @@ generic_file_aio_read(struct kiocb *iocb, const struct iovec *iov,
                         break;
         }
  out:
-       blk_finish_plug(&plug);
         return retval;
  }
  EXPORT_SYMBOL(generic_file_aio_read);
  
-static ssize_t
-do_readahead(struct address_space *mapping, struct file *filp,
-            pgoff_t index, unsigned long nr)
-{
-       if (!mapping || !mapping->a_ops || !mapping->a_ops->readpage)
-               return -EINVAL;
-
-       force_page_cache_readahead(mapping, filp, index, nr);
-       return 0;
-}
-
-SYSCALL_DEFINE(readahead)(int fd, loff_t offset, size_t count)
-{
-       ssize_t ret;
-       struct file *file;
-
-       ret = -EBADF;
-       file = fget(fd);
-       if (file) {
-               if (file->f_mode & FMODE_READ) {
-                       struct address_space *mapping = file->f_mapping;
-                       pgoff_t start = offset >> PAGE_CACHE_SHIFT;
-                       pgoff_t end = (offset + count - 1) >> PAGE_CACHE_SHIFT;
-                       unsigned long len = end - start + 1;
-                       ret = do_readahead(mapping, file, start, len);
-               }
-               fput(file);
-       }
-       return ret;
-}
-#ifdef CONFIG_HAVE_SYSCALL_WRAPPERS
-asmlinkage long SyS_readahead(long fd, loff_t offset, long count)
-{
-       return SYSC_readahead((int) fd, offset, (size_t) count);
-}
-SYSCALL_ALIAS(sys_readahead, SyS_readahead);
-#endif
-
  #ifdef CONFIG_MMU
  /**
   * page_cache_read - adds requested page to the page cache if not already there
@@ -1651,13 +1625,13 @@ int filemap_fault(struct vm_area_struct *vma, struct vm_fault *vmf)
          * Do we have something in the page cache already?
          */
         page = find_get_page(mapping, offset);
-       if (likely(page)) {
+       if (likely(page) && !(vmf->flags & FAULT_FLAG_TRIED)) {
                 /*
                  * We found the page, so try async readahead before
                  * waiting for the lock.
                  */
                 do_async_mmap_readahead(vma, ra, file, page, offset);
-       } else {
+       } else if (!page) {
                 /* No page in the page cache at all */
                 do_sync_mmap_readahead(vma, ra, file, offset);
                 count_vm_event(PGMAJFAULT);
@@ -1752,8 +1726,37 @@ page_not_uptodate:
  }
  EXPORT_SYMBOL(filemap_fault);
  
+int filemap_page_mkwrite(struct vm_area_struct *vma, struct vm_fault *vmf)
+{
+       struct page *page = vmf->page;
+       struct inode *inode = file_inode(vma->vm_file);
+       int ret = VM_FAULT_LOCKED;
+
+       sb_start_pagefault(inode->i_sb);
+       file_update_time(vma->vm_file);
+       lock_page(page);
+       if (page->mapping != inode->i_mapping) {
+               unlock_page(page);
+               ret = VM_FAULT_NOPAGE;
+               goto out;
+       }
+       /*
+        * We mark the page dirty already here so that when freeze is in
+        * progress, we are guaranteed that writeback during freezing will
+        * see the dirty page and writeprotect it again.
+        */
+       set_page_dirty(page);
+       wait_for_stable_page(page);
+out:
+       sb_end_pagefault(inode->i_sb);
+       return ret;
+}
+EXPORT_SYMBOL(filemap_page_mkwrite);
+
  const struct vm_operations_struct generic_file_vm_ops = {
         .fault          = filemap_fault,
+       .page_mkwrite   = filemap_page_mkwrite,
+       .remap_pages    = generic_file_remap_pages,
  };
  
  /* This is used for a general mmap of a disk file */
@@ -1766,7 +1769,6 @@ int generic_file_mmap(struct file * file, struct vm_area_struct * vma)
                 return -ENOEXEC;
         file_accessed(file);
         vma->vm_ops = &generic_file_vm_ops;
-       vma->vm_flags |= VM_CAN_NONLINEAR;
         return 0;
  }
  
@@ -1795,7 +1797,7 @@ EXPORT_SYMBOL(generic_file_readonly_mmap);
  
  static struct page *__read_cache_page(struct address_space *mapping,
                                 pgoff_t index,
-                               int (*filler)(void *,struct page*),
+                               int (*filler)(void *, struct page *),
                                 void *data,
                                 gfp_t gfp)
  {
@@ -1807,7 +1809,7 @@ repeat:
                 page = __page_cache_alloc(gfp | __GFP_COLD);
                 if (!page)
                         return ERR_PTR(-ENOMEM);
-               err = add_to_page_cache_lru(page, mapping, index, GFP_KERNEL);
+               err = add_to_page_cache_lru(page, mapping, index, gfp);
                 if (unlikely(err)) {
                         page_cache_release(page);
                         if (err == -EEXIST)
@@ -1826,7 +1828,7 @@ repeat:
  
  static struct page *do_read_cache_page(struct address_space *mapping,
                                 pgoff_t index,
-                               int (*filler)(void *,struct page*),
+                               int (*filler)(void *, struct page *),
                                 void *data,
                                 gfp_t gfp)
  
@@ -1866,7 +1868,7 @@ out:
   * @mapping:   the page's address_space
   * @index:     the page index
   * @filler:    function to perform the read
- * @data:      destination for read data
+ * @data:      first arg to filler(data, page) function, often left as NULL
   *
   * Same as read_cache_page, but don't wait for page to become unlocked
   * after submitting it to the filler.
@@ -1878,7 +1880,7 @@ out:
   */
  struct page *read_cache_page_async(struct address_space *mapping,
                                 pgoff_t index,
-                               int (*filler)(void *,struct page*),
+                               int (*filler)(void *, struct page *),
                                 void *data)
  {
         return do_read_cache_page(mapping, index, filler, data, mapping_gfp_mask(mapping));
@@ -1904,10 +1906,7 @@ static struct page *wait_on_page_read(struct page *page)
   * @gfp:       the page allocator flags to use if allocating
   *
   * This is the same as "read_mapping_page(mapping, index, NULL)", but with
- * any new page allocations done using the specified allocation flags. Note
- * that the Radix tree operations will still use GFP_KERNEL, so you can't
- * expect to do this atomically or anything like that - but you can pass in
- * other page requirements.
+ * any new page allocations done using the specified allocation flags.
   *
   * If the page does not get brought uptodate, return -EIO.
   */
@@ -1926,7 +1925,7 @@ EXPORT_SYMBOL(read_cache_page_gfp);
   * @mapping:   the page's address_space
   * @index:     the page index
   * @filler:    function to perform the read
- * @data:      destination for read data
+ * @data:      first arg to filler(data, page) function, often left as NULL
   *
   * Read into the page cache. If a page already exists, and PageUptodate() is
   * not set, try to fill the page then wait for it to become unlocked.
@@ -1935,78 +1934,13 @@ EXPORT_SYMBOL(read_cache_page_gfp);
   */
  struct page *read_cache_page(struct address_space *mapping,
                                 pgoff_t index,
-                               int (*filler)(void *,struct page*),
+                               int (*filler)(void *, struct page *),
                                 void *data)
  {
         return wait_on_page_read(read_cache_page_async(mapping, index, filler, data));
  }
  EXPORT_SYMBOL(read_cache_page);
  
-/*
- * The logic we want is
- *
- *     if suid or (sgid and xgrp)
- *             remove privs
- */
-int should_remove_suid(struct dentry *dentry)
-{
-       mode_t mode = dentry->d_inode->i_mode;
-       int kill = 0;
-
-       /* suid always must be killed */
-       if (unlikely(mode & S_ISUID))
-               kill = ATTR_KILL_SUID;
-
-       /*
-        * sgid without any exec bits is just a mandatory locking mark; leave
-        * it alone.  If some exec bits are set, it's a real sgid; kill it.
-        */
-       if (unlikely((mode & S_ISGID) && (mode & S_IXGRP)))
-               kill |= ATTR_KILL_SGID;
-
-       if (unlikely(kill && !capable(CAP_FSETID) && S_ISREG(mode)))
-               return kill;
-
-       return 0;
-}
-EXPORT_SYMBOL(should_remove_suid);
-
-static int __remove_suid(struct dentry *dentry, int kill)
-{
-       struct iattr newattrs;
-
-       newattrs.ia_valid = ATTR_FORCE | kill;
-       return notify_change(dentry, &newattrs);
-}
-
-int file_remove_suid(struct file *file)
-{
-       struct dentry *dentry = file->f_path.dentry;
-       struct inode *inode = dentry->d_inode;
-       int killsuid;
-       int killpriv;
-       int error = 0;
-
-       /* Fast path for nothing security related */
-       if (IS_NOSEC(inode))
-               return 0;
-
-       killsuid = should_remove_suid(dentry);
-       killpriv = security_inode_need_killpriv(dentry);
-
-       if (killpriv < 0)
-               return killpriv;
-       if (killpriv)
-               error = security_inode_killpriv(dentry);
-       if (!error && killsuid)
-               error = __remove_suid(dentry, killsuid);
-       if (!error && (inode->i_sb->s_flags & MS_NOSEC))
-               inode->i_flags |= S_NOSEC;
-
-       return error;
-}
-EXPORT_SYMBOL(file_remove_suid);
-
  static size_t __iovec_copy_from_user_inatomic(char *vaddr,
                         const struct iovec *iov, size_t base, size_t bytes)
  {
@@ -2041,7 +1975,7 @@ size_t iov_iter_copy_from_user_atomic(struct page *page,
         size_t copied;
  
         BUG_ON(!in_atomic());
-       kaddr = kmap_atomic(page, KM_USER0);
+       kaddr = kmap_atomic(page);
         if (likely(i->nr_segs == 1)) {
                 int left;
                 char __user *buf = i->iov->iov_base + i->iov_offset;
@@ -2051,7 +1985,7 @@ size_t iov_iter_copy_from_user_atomic(struct page *page,
                 copied = __iovec_copy_from_user_inatomic(kaddr + offset,
                                                 i->iov, i->iov_offset, bytes);
         }
-       kunmap_atomic(kaddr, KM_USER0);
+       kunmap_atomic(kaddr);
  
         return copied;
  }
@@ -2094,6 +2028,7 @@ void iov_iter_advance(struct iov_iter *i, size_t bytes)
         } else {
                 const struct iovec *iov = i->iov;
                 size_t base = i->iov_offset;
+               unsigned long nr_segs = i->nr_segs;
  
                 /*
                  * The !iov->iov_len check ensures we skip over unlikely
@@ -2109,11 +2044,13 @@ void iov_iter_advance(struct iov_iter *i, size_t bytes)
                         base += copy;
                         if (iov->iov_len == base) {
                                 iov++;
+                               nr_segs--;
                                 base = 0;
                         }
                 }
                 i->iov = iov;
                 i->iov_offset = base;
+               i->nr_segs = nr_segs;
         }
  }
  EXPORT_SYMBOL(iov_iter_advance);
@@ -2138,7 +2075,7 @@ EXPORT_SYMBOL(iov_iter_fault_in_readable);
  /*
   * Return the count of just the current iov_iter segment.
   */
-size_t iov_iter_single_seg_count(struct iov_iter *i)
+size_t iov_iter_single_seg_count(const struct iov_iter *i)
  {
         const struct iovec *iov = i->iov;
         if (i->nr_segs == 1)
@@ -2330,8 +2267,13 @@ struct page *grab_cache_page_write_begin(struct address_space *mapping,
                                         pgoff_t index, unsigned flags)
  {
         int status;
+       gfp_t gfp_mask;
         struct page *page;
         gfp_t gfp_notmask = 0;
+
+       gfp_mask = mapping_gfp_mask(mapping);
+       if (mapping_cap_account_dirty(mapping))
+               gfp_mask |= __GFP_WRITE;
         if (flags & AOP_FLAG_NOFS)
                 gfp_notmask = __GFP_FS;
  repeat:
@@ -2339,7 +2281,7 @@ repeat:
         if (page)
                 goto found;
  
-       page = __page_cache_alloc(mapping_gfp_mask(mapping) & ~gfp_notmask);
+       page = __page_cache_alloc(gfp_mask & ~gfp_notmask);
         if (!page)
                 return NULL;
         status = add_to_page_cache_lru(page, mapping, index,
@@ -2351,7 +2293,7 @@ repeat:
                 return NULL;
         }
  found:
-       wait_on_page_writeback(page);
+       wait_for_stable_page(page);
         return page;
  }
  EXPORT_SYMBOL(grab_cache_page_write_begin);
@@ -2383,7 +2325,6 @@ static ssize_t generic_perform_write(struct file *file,
                                                 iov_iter_count(i));
  
  again:
-
                 /*
                  * Bring in the user page that we will copy from _first_.
                  * Otherwise there's a nasty deadlock on copying from the
@@ -2439,7 +2380,10 @@ again:
                 written += copied;
  
                 balance_dirty_pages_ratelimited(mapping);
-
+               if (fatal_signal_pending(current)) {
+                       status = -EINTR;
+                       break;
+               }
         } while (iov_iter_count(i));
  
         return written ? written : status;
@@ -2505,8 +2449,6 @@ ssize_t __generic_file_aio_write(struct kiocb *iocb, const struct iovec *iov,
         count = ocount;
         pos = *ppos;
  
-       vfs_check_frozen(inode->i_sb, SB_FREEZE_WRITE);
-
         /* We can write back this queue in page reclaim */
         current->backing_dev_info = mapping->backing_dev_info;
         written = 0;
@@ -2522,7 +2464,9 @@ ssize_t __generic_file_aio_write(struct kiocb *iocb, const struct iovec *iov,
         if (err)
                 goto out;
  
-       file_update_time(file);
+       err = file_update_time(file);
+       if (err)
+               goto out;
  
         /* coalesce the iovecs and go direct-to-BIO for O_DIRECT */
         if (unlikely(file->f_flags & O_DIRECT)) {
@@ -2598,13 +2542,11 @@ ssize_t generic_file_aio_write(struct kiocb *iocb, const struct iovec *iov,
  {
         struct file *file = iocb->ki_filp;
         struct inode *inode = file->f_mapping->host;
-       struct blk_plug plug;
         ssize_t ret;
  
         BUG_ON(iocb->ki_pos != pos);
  
         mutex_lock(&inode->i_mutex);
-       blk_start_plug(&plug);
         ret = __generic_file_aio_write(iocb, iov, nr_segs, &iocb->ki_pos);
         mutex_unlock(&inode->i_mutex);
  
@@ -2615,7 +2557,6 @@ ssize_t generic_file_aio_write(struct kiocb *iocb, const struct iovec *iov,
                 if (err < 0 && ret > 0)
                         ret = err;
         }
-       blk_finish_plug(&plug);
         return ret;
  }
  EXPORT_SYMBOL(generic_file_aio_write);