rk3168:support act8846 set sleep voltage

[firefly-linux-kernel-4.4.55.git] / mm / hugetlb.c
diff --git a/mm/hugetlb.c b/mm/hugetlb.c

index 6402458fee38ca5ba2109882e92ebbf63e97c787..037f077b986525796df3263ea118a24a7e4f7e4f 100644 (file)
--- a/mm/hugetlb.c
+++ b/mm/hugetlb.c
@@ -460,8 +460,10 @@ static struct page *dequeue_huge_page_vma(struct hstate *h,
         struct zonelist *zonelist;
         struct zone *zone;
         struct zoneref *z;
+       unsigned int cpuset_mems_cookie;
  
-       get_mems_allowed();
+retry_cpuset:
+       cpuset_mems_cookie = get_mems_allowed();
         zonelist = huge_zonelist(vma, address,
                                         htlb_alloc_mask, &mpol, &nodemask);
         /*
@@ -488,10 +490,15 @@ static struct page *dequeue_huge_page_vma(struct hstate *h,
                         }
                 }
         }
-err:
+
         mpol_cond_put(mpol);
-       put_mems_allowed();
+       if (unlikely(!put_mems_allowed(cpuset_mems_cookie) && !page))
+               goto retry_cpuset;
         return page;
+
+err:
+       mpol_cond_put(mpol);
+       return NULL;
  }
  
  static void update_and_free_page(struct hstate *h, struct page *page)
@@ -575,6 +582,7 @@ static void prep_compound_gigantic_page(struct page *page, unsigned long order)
         __SetPageHead(page);
         for (i = 1; i < nr_pages; i++, p = mem_map_next(p, page, i)) {
                 __SetPageTail(p);
+               set_page_count(p, 0);
                 p->first_page = page;
         }
  }
@@ -900,7 +908,6 @@ retry:
         h->resv_huge_pages += delta;
         ret = 0;
  
-       spin_unlock(&hugetlb_lock);
         /* Free the needed pages to the hugetlb pool */
         list_for_each_entry_safe(page, tmp, &surplus_list, lru) {
                 if ((--needed) < 0)
@@ -914,6 +921,7 @@ retry:
                 VM_BUG_ON(page_count(page));
                 enqueue_huge_page(h, page);
         }
+       spin_unlock(&hugetlb_lock);
  
         /* Free unnecessary surplus pages to the buddy allocator */
  free:
@@ -1111,6 +1119,14 @@ static void __init gather_bootmem_prealloc(void)
                 WARN_ON(page_count(page) != 1);
                 prep_compound_huge_page(page, h->order);
                 prep_new_huge_page(h, page, page_to_nid(page));
+               /*
+                * If we had gigantic hugepages allocated at boot time, we need
+                * to restore the 'stolen' pages to totalram_pages in order to
+                * fix confusing memory reports from free(1) and other
+                * side-effects, like CommitLimit going negative.
+                */
+               if (h->order > (MAX_ORDER - 1))
+                       totalram_pages += 1 << h->order;
         }
  }
  
@@ -2051,6 +2067,15 @@ static void hugetlb_vm_op_open(struct vm_area_struct *vma)
                 kref_get(&reservations->refs);
  }
  
+static void resv_map_put(struct vm_area_struct *vma)
+{
+       struct resv_map *reservations = vma_resv_map(vma);
+
+       if (!reservations)
+               return;
+       kref_put(&reservations->refs, resv_map_release);
+}
+
  static void hugetlb_vm_op_close(struct vm_area_struct *vma)
  {
         struct hstate *h = hstate_vma(vma);
@@ -2066,7 +2091,7 @@ static void hugetlb_vm_op_close(struct vm_area_struct *vma)
                 reserve = (end - start) -
                         region_count(&reservations->regions, start, end);
  
-               kref_put(&reservations->refs, resv_map_release);
+               resv_map_put(vma);
  
                 if (reserve) {
                         hugetlb_acct_memory(h, -reserve);
@@ -2276,6 +2301,22 @@ void unmap_hugepage_range(struct vm_area_struct *vma, unsigned long start,
  {
         mutex_lock(&vma->vm_file->f_mapping->i_mmap_mutex);
         __unmap_hugepage_range(vma, start, end, ref_page);
+       /*
+        * Clear this flag so that x86's huge_pmd_share page_table_shareable
+        * test will fail on a vma being torn down, and not grab a page table
+        * on its way out.  We're lucky that the flag has such an appropriate
+        * name, and can in fact be safely cleared here. We could clear it
+        * before the __unmap_hugepage_range above, but all that's necessary
+        * is to clear it before releasing the i_mmap_mutex below.
+        *
+        * This works because in the contexts this is called, the VMA is
+        * going to be destroyed. It is not vulnerable to madvise(DONTNEED)
+        * because madvise is not supported on hugetlbfs. The same applies
+        * for direct IO. unmap_hugepage_range() is only being called just
+        * before free_pgtables() so clearing VM_MAYSHARE will not cause
+        * surprises later.
+        */
+       vma->vm_flags &= ~VM_MAYSHARE;
         mutex_unlock(&vma->vm_file->f_mapping->i_mmap_mutex);
  }
  
@@ -2389,7 +2430,6 @@ retry_avoidcopy:
                 if (outside_reserve) {
                         BUG_ON(huge_pte_none(pte));
                         if (unmap_ref_private(mm, vma, old_page, address)) {
-                               BUG_ON(page_count(old_page) != 1);
                                 BUG_ON(huge_pte_none(pte));
                                 spin_lock(&mm->page_table_lock);
                                 goto retry_avoidcopy;
@@ -2407,6 +2447,8 @@ retry_avoidcopy:
          * anon_vma prepared.
          */
         if (unlikely(anon_vma_prepare(vma))) {
+               page_cache_release(new_page);
+               page_cache_release(old_page);
                 /* Caller expects lock to be held */
                 spin_lock(&mm->page_table_lock);
                 return VM_FAULT_OOM;
@@ -2668,6 +2710,7 @@ int hugetlb_fault(struct mm_struct *mm, struct vm_area_struct *vma,
          * so no worry about deadlock.
          */
         page = pte_page(entry);
+       get_page(page);
         if (page != pagecache_page)
                 lock_page(page);
  
@@ -2699,6 +2742,7 @@ out_page_table_lock:
         }
         if (page != pagecache_page)
                 unlock_page(page);
+       put_page(page);
  
  out_mutex:
         mutex_unlock(&hugetlb_instantiation_mutex);
@@ -2825,9 +2869,14 @@ void hugetlb_change_protection(struct vm_area_struct *vma,
                 }
         }
         spin_unlock(&mm->page_table_lock);
-       mutex_unlock(&vma->vm_file->f_mapping->i_mmap_mutex);
-
+       /*
+        * Must flush TLB before releasing i_mmap_mutex: x86's huge_pmd_unshare
+        * may have cleared our pud entry and done put_page on the page table:
+        * once we release i_mmap_mutex, another task can do the final put_page
+        * and that page table can be reused and filled with junk.
+        */
         flush_tlb_range(vma, start, end);
+       mutex_unlock(&vma->vm_file->f_mapping->i_mmap_mutex);
  }
  
  int hugetlb_reserve_pages(struct inode *inode,
@@ -2865,12 +2914,16 @@ int hugetlb_reserve_pages(struct inode *inode,
                 set_vma_resv_flags(vma, HPAGE_RESV_OWNER);
         }
  
-       if (chg < 0)
-               return chg;
+       if (chg < 0) {
+               ret = chg;
+               goto out_err;
+       }
  
         /* There must be enough filesystem quota for the mapping */
-       if (hugetlb_get_quota(inode->i_mapping, chg))
-               return -ENOSPC;
+       if (hugetlb_get_quota(inode->i_mapping, chg)) {
+               ret = -ENOSPC;
+               goto out_err;
+       }
  
         /*
          * Check enough hugepages are available for the reservation.
@@ -2879,7 +2932,7 @@ int hugetlb_reserve_pages(struct inode *inode,
         ret = hugetlb_acct_memory(h, chg);
         if (ret < 0) {
                 hugetlb_put_quota(inode->i_mapping, chg);
-               return ret;
+               goto out_err;
         }
  
         /*
@@ -2896,6 +2949,10 @@ int hugetlb_reserve_pages(struct inode *inode,
         if (!vma || vma->vm_flags & VM_MAYSHARE)
                 region_add(&inode->i_mapping->private_list, from, to);
         return 0;
+out_err:
+       if (vma)
+               resv_map_put(vma);
+       return ret;
  }
  
  void hugetlb_unreserve_pages(struct inode *inode, long offset, long freed)