Whamcloud - gitweb
LU-73 Make register_shrinker argument more visible.
[fs/lustre-release.git] / lustre / ptlrpc / sec_bulk.c
index c09cf0c..7243e8f 100644 (file)
@@ -26,7 +26,7 @@
  * GPL HEADER END
  */
 /*
- * Copyright  2008 Sun Microsystems, Inc. All rights reserved
+ * Copyright (c) 2007, 2010, Oracle and/or its affiliates. All rights reserved.
  * Use is subject to license terms.
  */
 /*
@@ -107,7 +107,7 @@ static struct ptlrpc_enc_page_pool {
         /*
          * in-pool pages bookkeeping
          */
-        spinlock_t       epp_lock;        /* protect following fields */
+        cfs_spinlock_t   epp_lock;        /* protect following fields */
         unsigned long    epp_total_pages; /* total pages in pools */
         unsigned long    epp_free_pages;  /* current pages available */
 
@@ -132,8 +132,8 @@ static struct ptlrpc_enc_page_pool {
 /*
  * memory shrinker
  */
-const int pools_shrinker_seeks = DEFAULT_SEEKS;
-static struct shrinker *pools_shrinker = NULL;
+const int pools_shrinker_seeks = CFS_DEFAULT_SEEKS;
+static struct cfs_shrinker *pools_shrinker = NULL;
 
 
 /*
@@ -144,7 +144,7 @@ int sptlrpc_proc_read_enc_pool(char *page, char **start, off_t off, int count,
 {
         int     rc;
 
-        spin_lock(&page_pools.epp_lock);
+        cfs_spin_lock(&page_pools.epp_lock);
 
         rc = snprintf(page, count,
                       "physical pages:          %lu\n"
@@ -166,7 +166,7 @@ int sptlrpc_proc_read_enc_pool(char *page, char **start, off_t off, int count,
                       "max waitqueue depth:     %u\n"
                       "max wait time:           "CFS_TIME_T"/%u\n"
                       ,
-                      num_physpages,
+                      cfs_num_physpages,
                       PAGES_PER_POOL,
                       page_pools.epp_max_pages,
                       page_pools.epp_max_pools,
@@ -183,10 +183,10 @@ int sptlrpc_proc_read_enc_pool(char *page, char **start, off_t off, int count,
                       page_pools.epp_st_missings,
                       page_pools.epp_st_lowfree,
                       page_pools.epp_st_max_wqlen,
-                      page_pools.epp_st_max_wait, HZ
+                      page_pools.epp_st_max_wait, CFS_HZ
                      );
 
-        spin_unlock(&page_pools.epp_lock);
+        cfs_spin_unlock(&page_pools.epp_lock);
         return rc;
 }
 
@@ -206,7 +206,7 @@ static void enc_pools_release_free_pages(long npages)
         page_pools.epp_total_pages -= npages;
 
         /* max pool index after the release */
-        p_idx_max1 = page_pools.epp_total_pages == 0 ? 0 :
+        p_idx_max1 = page_pools.epp_total_pages == 0 ? -1 :
                      ((page_pools.epp_total_pages - 1) / PAGES_PER_POOL);
 
         p_idx = page_pools.epp_free_pages / PAGES_PER_POOL;
@@ -236,50 +236,41 @@ static void enc_pools_release_free_pages(long npages)
 }
 
 /*
- * could be called frequently for query (@nr_to_scan == 0)
+ * could be called frequently for query (@nr_to_scan == 0).
+ * we try to keep at least PTLRPC_MAX_BRW_PAGES pages in the pool.
  */
-static int enc_pools_shrink(int nr_to_scan, unsigned int gfp_mask)
+static int enc_pools_shrink(SHRINKER_FIRST_ARG int nr_to_scan,
+                            unsigned int gfp_mask)
 {
-        unsigned long   ret;
-
-        spin_lock(&page_pools.epp_lock);
-
-        if (nr_to_scan > page_pools.epp_free_pages)
-                nr_to_scan = page_pools.epp_free_pages;
-
-        if (nr_to_scan > 0) {
-                enc_pools_release_free_pages(nr_to_scan);
-                CDEBUG(D_SEC, "released %d pages, %ld left\n",
-                       nr_to_scan, page_pools.epp_free_pages);
-
-                page_pools.epp_st_shrinks++;
-                page_pools.epp_last_shrink = cfs_time_current_sec();
-        }
-
-        /*
-         * try to keep at least PTLRPC_MAX_BRW_PAGES pages in the pool
-         */
-        if (page_pools.epp_free_pages <= PTLRPC_MAX_BRW_PAGES) {
-                ret = 0;
-                goto out_unlock;
+        if (unlikely(nr_to_scan != 0)) {
+                cfs_spin_lock(&page_pools.epp_lock);
+                nr_to_scan = min(nr_to_scan, (int) page_pools.epp_free_pages -
+                                             PTLRPC_MAX_BRW_PAGES);
+                if (nr_to_scan > 0) {
+                        enc_pools_release_free_pages(nr_to_scan);
+                        CDEBUG(D_SEC, "released %d pages, %ld left\n",
+                               nr_to_scan, page_pools.epp_free_pages);
+
+                        page_pools.epp_st_shrinks++;
+                        page_pools.epp_last_shrink = cfs_time_current_sec();
+                }
+                cfs_spin_unlock(&page_pools.epp_lock);
         }
 
         /*
-         * if no pool access for a long time, we consider it's fully idle
+         * if there was no pool access for a long time, we consider the pool
+         * fully idle. epp_last_access is read unlocked; a little race is fine.
          */
-        if (cfs_time_current_sec() - page_pools.epp_last_access >
-            CACHE_QUIESCENT_PERIOD)
+        if (unlikely(cfs_time_current_sec() - page_pools.epp_last_access >
+                     CACHE_QUIESCENT_PERIOD)) {
+                cfs_spin_lock(&page_pools.epp_lock);
                 page_pools.epp_idle_idx = IDLE_IDX_MAX;
+                cfs_spin_unlock(&page_pools.epp_lock);
+        }
 
         LASSERT(page_pools.epp_idle_idx <= IDLE_IDX_MAX);
-        ret = (page_pools.epp_free_pages * page_pools.epp_idle_idx /
-               IDLE_IDX_MAX);
-        if (page_pools.epp_free_pages - ret < PTLRPC_MAX_BRW_PAGES)
-                ret = page_pools.epp_free_pages - PTLRPC_MAX_BRW_PAGES;
-
-out_unlock:
-        spin_unlock(&page_pools.epp_lock);
-        return ret;
+        return max((int) page_pools.epp_free_pages - PTLRPC_MAX_BRW_PAGES, 0) *
+               (IDLE_IDX_MAX - page_pools.epp_idle_idx) / IDLE_IDX_MAX;
 }
 
 static inline
@@ -328,8 +319,9 @@ static void enc_pools_insert(cfs_page_t ***pools, int npools, int npages)
         LASSERT(npages > 0);
         LASSERT(page_pools.epp_total_pages+npages <= page_pools.epp_max_pages);
         LASSERT(npages_to_npools(npages) == npools);
+        LASSERT(page_pools.epp_growing);
 
-        spin_lock(&page_pools.epp_lock);
+        cfs_spin_lock(&page_pools.epp_lock);
 
         /*
          * (1) fill all the free slots of current pools.
@@ -396,12 +388,12 @@ static void enc_pools_insert(cfs_page_t ***pools, int npools, int npages)
         CDEBUG(D_SEC, "add %d pages to total %lu\n", npages,
                page_pools.epp_total_pages);
 
-        spin_unlock(&page_pools.epp_lock);
+        cfs_spin_unlock(&page_pools.epp_lock);
 }
 
 static int enc_pools_add_pages(int npages)
 {
-        static DECLARE_MUTEX(sem_add_pages);
+        static CFS_DECLARE_MUTEX(sem_add_pages);
         cfs_page_t   ***pools;
         int             npools, alloced = 0;
         int             i, j, rc = -ENOMEM;
@@ -409,7 +401,7 @@ static int enc_pools_add_pages(int npages)
         if (npages < PTLRPC_MAX_BRW_PAGES)
                 npages = PTLRPC_MAX_BRW_PAGES;
 
-        down(&sem_add_pages);
+        cfs_down(&sem_add_pages);
 
         if (npages + page_pools.epp_total_pages > page_pools.epp_max_pages)
                 npages = page_pools.epp_max_pages - page_pools.epp_total_pages;
@@ -436,6 +428,7 @@ static int enc_pools_add_pages(int npages)
                         alloced++;
                 }
         }
+        LASSERT(alloced == npages);
 
         enc_pools_insert(pools, npools, npages);
         CDEBUG(D_SEC, "added %d pages into pools\n", npages);
@@ -450,7 +443,7 @@ out:
                 CERROR("Failed to allocate %d enc pages\n", npages);
         }
 
-        up(&sem_add_pages);
+        cfs_up(&sem_add_pages);
         return rc;
 }
 
@@ -521,7 +514,7 @@ int sptlrpc_enc_pool_get_pages(struct ptlrpc_bulk_desc *desc)
         if (desc->bd_enc_iov == NULL)
                 return -ENOMEM;
 
-        spin_lock(&page_pools.epp_lock);
+        cfs_spin_lock(&page_pools.epp_lock);
 
         page_pools.epp_st_access++;
 again:
@@ -537,9 +530,9 @@ again:
                 if (enc_pools_should_grow(desc->bd_iov_count, now)) {
                         page_pools.epp_growing = 1;
 
-                        spin_unlock(&page_pools.epp_lock);
+                        cfs_spin_unlock(&page_pools.epp_lock);
                         enc_pools_add_pages(page_pools.epp_pages_short / 2);
-                        spin_lock(&page_pools.epp_lock);
+                        cfs_spin_lock(&page_pools.epp_lock);
 
                         page_pools.epp_growing = 0;
 
@@ -550,15 +543,15 @@ again:
                                 page_pools.epp_st_max_wqlen =
                                                 page_pools.epp_waitqlen;
 
-                        set_current_state(CFS_TASK_UNINT);
+                        cfs_set_current_state(CFS_TASK_UNINT);
                         cfs_waitlink_init(&waitlink);
                         cfs_waitq_add(&page_pools.epp_waitq, &waitlink);
 
-                        spin_unlock(&page_pools.epp_lock);
+                        cfs_spin_unlock(&page_pools.epp_lock);
                         cfs_waitq_wait(&waitlink, CFS_TASK_UNINT);
                         cfs_waitq_del(&page_pools.epp_waitq, &waitlink);
                         LASSERT(page_pools.epp_waitqlen > 0);
-                        spin_lock(&page_pools.epp_lock);
+                        cfs_spin_lock(&page_pools.epp_lock);
                         page_pools.epp_waitqlen--;
                 }
 
@@ -610,7 +603,7 @@ again:
 
         page_pools.epp_last_access = cfs_time_current_sec();
 
-        spin_unlock(&page_pools.epp_lock);
+        cfs_spin_unlock(&page_pools.epp_lock);
         return 0;
 }
 EXPORT_SYMBOL(sptlrpc_enc_pool_get_pages);
@@ -625,7 +618,7 @@ void sptlrpc_enc_pool_put_pages(struct ptlrpc_bulk_desc *desc)
 
         LASSERT(desc->bd_iov_count > 0);
 
-        spin_lock(&page_pools.epp_lock);
+        cfs_spin_lock(&page_pools.epp_lock);
 
         p_idx = page_pools.epp_free_pages / PAGES_PER_POOL;
         g_idx = page_pools.epp_free_pages % PAGES_PER_POOL;
@@ -652,7 +645,7 @@ void sptlrpc_enc_pool_put_pages(struct ptlrpc_bulk_desc *desc)
 
         enc_pools_wakeup();
 
-        spin_unlock(&page_pools.epp_lock);
+        cfs_spin_unlock(&page_pools.epp_lock);
 
         OBD_FREE(desc->bd_enc_iov,
                  desc->bd_iov_count * sizeof(*desc->bd_enc_iov));
@@ -669,21 +662,21 @@ int sptlrpc_enc_pool_add_user(void)
 {
         int     need_grow = 0;
 
-        spin_lock(&page_pools.epp_lock);
+        cfs_spin_lock(&page_pools.epp_lock);
         if (page_pools.epp_growing == 0 && page_pools.epp_total_pages == 0) {
                 page_pools.epp_growing = 1;
                 need_grow = 1;
         }
-        spin_unlock(&page_pools.epp_lock);
+        cfs_spin_unlock(&page_pools.epp_lock);
 
         if (need_grow) {
                 enc_pools_add_pages(PTLRPC_MAX_BRW_PAGES +
                                     PTLRPC_MAX_BRW_PAGES);
 
-                spin_lock(&page_pools.epp_lock);
+                cfs_spin_lock(&page_pools.epp_lock);
                 page_pools.epp_growing = 0;
                 enc_pools_wakeup();
-                spin_unlock(&page_pools.epp_lock);
+                cfs_spin_unlock(&page_pools.epp_lock);
         }
         return 0;
 }
@@ -722,7 +715,7 @@ int sptlrpc_enc_pool_init(void)
          * maximum capacity is 1/8 of total physical memory.
          * is the 1/8 a good number?
          */
-        page_pools.epp_max_pages = num_physpages / 8;
+        page_pools.epp_max_pages = cfs_num_physpages / 8;
         page_pools.epp_max_pools = npages_to_npools(page_pools.epp_max_pages);
 
         cfs_waitq_init(&page_pools.epp_waitq);
@@ -735,7 +728,7 @@ int sptlrpc_enc_pool_init(void)
         page_pools.epp_last_shrink = cfs_time_current_sec();
         page_pools.epp_last_access = cfs_time_current_sec();
 
-        spin_lock_init(&page_pools.epp_lock);
+        cfs_spin_lock_init(&page_pools.epp_lock);
         page_pools.epp_total_pages = 0;
         page_pools.epp_free_pages = 0;
 
@@ -753,7 +746,8 @@ int sptlrpc_enc_pool_init(void)
         if (page_pools.epp_pools == NULL)
                 return -ENOMEM;
 
-        pools_shrinker = set_shrinker(pools_shrinker_seeks, enc_pools_shrink);
+        pools_shrinker = cfs_set_shrinker(pools_shrinker_seeks,
+                                          enc_pools_shrink);
         if (pools_shrinker == NULL) {
                 enc_pools_free();
                 return -ENOMEM;
@@ -770,7 +764,7 @@ void sptlrpc_enc_pool_fini(void)
         LASSERT(page_pools.epp_pools);
         LASSERT(page_pools.epp_total_pages == page_pools.epp_free_pages);
 
-        remove_shrinker(pools_shrinker);
+        cfs_remove_shrinker(pools_shrinker);
 
         npools = npages_to_npools(page_pools.epp_total_pages);
         cleaned = enc_pools_cleanup(page_pools.epp_pools, npools);
@@ -786,7 +780,7 @@ void sptlrpc_enc_pool_fini(void)
                       page_pools.epp_st_grow_fails,
                       page_pools.epp_st_shrinks, page_pools.epp_st_access,
                       page_pools.epp_st_missings, page_pools.epp_st_max_wqlen,
-                      page_pools.epp_st_max_wait, HZ);
+                      page_pools.epp_st_max_wait, CFS_HZ);
         }
 }
 
@@ -863,7 +857,7 @@ __u8 sptlrpc_get_hash_alg(const char *algname)
 }
 EXPORT_SYMBOL(sptlrpc_get_hash_alg);
 
-int bulk_sec_desc_unpack(struct lustre_msg *msg, int offset)
+int bulk_sec_desc_unpack(struct lustre_msg *msg, int offset, int swabbed)
 {
         struct ptlrpc_bulk_sec_desc *bsd;
         int                          size = msg->lm_buflens[offset];
@@ -874,7 +868,7 @@ int bulk_sec_desc_unpack(struct lustre_msg *msg, int offset)
                 return -EINVAL;
         }
 
-        if (lustre_msg_swabbed(msg)) {
+        if (swabbed) {
                 __swab32s(&bsd->bsd_nob);
         }
 
@@ -989,9 +983,9 @@ int sptlrpc_get_bulk_checksum(struct ptlrpc_bulk_desc *desc, __u8 alg,
         hashsize = ll_crypto_hash_digestsize(hdesc.tfm);
 
         for (i = 0; i < desc->bd_iov_count; i++) {
-                sl.page = desc->bd_iov[i].kiov_page;
-                sl.offset = desc->bd_iov[i].kiov_offset;
-                sl.length = desc->bd_iov[i].kiov_len;
+                sg_set_page(&sl, desc->bd_iov[i].kiov_page,
+                             desc->bd_iov[i].kiov_len,
+                             desc->bd_iov[i].kiov_offset & ~CFS_PAGE_MASK);
                 ll_crypto_hash_update(&hdesc, &sl, sl.length);
         }