mm, swap: remove swap slot cache (0ff67f99) · Commits · git / linux-net

include/linux/swap.h

+0 −3

Original line number	Diff line number	Diff line
		@@ -465,7 +465,6 @@ void free_pages_and_swap_cache(struct encoded_page **, int);
		extern atomic_long_t nr_swap_pages;
		extern long total_swap_pages;
		extern atomic_t nr_rotate_swap;
		extern bool has_usable_swap(void);

		/* Swap 50% full? Release swapcache more aggressively.. */
		static inline bool vm_swap_full(void)
		@@ -483,13 +482,11 @@ swp_entry_t folio_alloc_swap(struct folio *folio);
		bool folio_free_swap(struct folio *folio);
		void put_swap_folio(struct folio *folio, swp_entry_t entry);
		extern swp_entry_t get_swap_page_of_type(int);
		extern int get_swap_pages(int n, swp_entry_t swp_entries[], int order);
		extern int add_swap_count_continuation(swp_entry_t, gfp_t);
		extern void swap_shmem_alloc(swp_entry_t, int);
		extern int swap_duplicate(swp_entry_t);
		extern int swapcache_prepare(swp_entry_t entry, int nr);
		extern void swap_free_nr(swp_entry_t entry, int nr_pages);
		extern void swapcache_free_entries(swp_entry_t *entries, int n);
		extern void free_swap_and_cache_nr(swp_entry_t entry, int nr);
		int swap_type_of(dev_t device, sector_t offset);
		int find_first_swap(dev_t *device);

include/linux/swap_slots.h

deleted100644 → 0

+0 −28

Original line number	Diff line number	Diff line
		/* SPDX-License-Identifier: GPL-2.0 */
		#ifndef _LINUX_SWAP_SLOTS_H
		#define _LINUX_SWAP_SLOTS_H

		#include <linux/swap.h>
		#include <linux/spinlock.h>
		#include <linux/mutex.h>

		#define SWAP_SLOTS_CACHE_SIZE SWAP_BATCH
		#define THRESHOLD_ACTIVATE_SWAP_SLOTS_CACHE (5*SWAP_SLOTS_CACHE_SIZE)
		#define THRESHOLD_DEACTIVATE_SWAP_SLOTS_CACHE (2*SWAP_SLOTS_CACHE_SIZE)

		struct swap_slots_cache {
		bool lock_initialized;
		struct mutex alloc_lock; /* protects slots, nr, cur */
		swp_entry_t *slots;
		int nr;
		int cur;
		int n_ret;
		};

		void disable_swap_slots_cache_lock(void);
		void reenable_swap_slots_cache_unlock(void);
		void enable_swap_slots_cache(void);

		extern bool swap_slot_cache_enabled;

		#endif /* _LINUX_SWAP_SLOTS_H */

mm/Makefile

+1 −1

Original line number	Diff line number	Diff line
		@@ -75,7 +75,7 @@ ifdef CONFIG_MMU
		obj-$(CONFIG_ADVISE_SYSCALLS) += madvise.o
		endif

		obj-$(CONFIG_SWAP) += page_io.o swap_state.o swapfile.o swap_slots.o
		obj-$(CONFIG_SWAP) += page_io.o swap_state.o swapfile.o
		obj-$(CONFIG_ZSWAP) += zswap.o
		obj-$(CONFIG_HAS_DMA) += dmapool.o
		obj-$(CONFIG_HUGETLBFS) += hugetlb.o

mm/swap_slots.c

deleted100644 → 0

+0 −295

Original line number	Diff line number	Diff line
		// SPDX-License-Identifier: GPL-2.0
		/*
		* Manage cache of swap slots to be used for and returned from
		* swap.
		*
		* Copyright(c) 2016 Intel Corporation.
		*
		* Author: Tim Chen <tim.c.chen@linux.intel.com>
		*
		* We allocate the swap slots from the global pool and put
		* it into local per cpu caches. This has the advantage
		* of no needing to acquire the swap_info lock every time
		* we need a new slot.
		*
		* There is also opportunity to simply return the slot
		* to local caches without needing to acquire swap_info
		* lock. We do not reuse the returned slots directly but
		* move them back to the global pool in a batch. This
		* allows the slots to coalesce and reduce fragmentation.
		*
		* The swap entry allocated is marked with SWAP_HAS_CACHE
		* flag in map_count that prevents it from being allocated
		* again from the global pool.
		*
		* The swap slots cache is protected by a mutex instead of
		* a spin lock as when we search for slots with scan_swap_map,
		* we can possibly sleep.
		*/

		#include <linux/swap_slots.h>
		#include <linux/cpu.h>
		#include <linux/cpumask.h>
		#include <linux/slab.h>
		#include <linux/vmalloc.h>
		#include <linux/mutex.h>
		#include <linux/mm.h>

		static DEFINE_PER_CPU(struct swap_slots_cache, swp_slots);
		static bool swap_slot_cache_active;
		bool swap_slot_cache_enabled;
		static bool swap_slot_cache_initialized;
		static DEFINE_MUTEX(swap_slots_cache_mutex);
		/* Serialize swap slots cache enable/disable operations */
		static DEFINE_MUTEX(swap_slots_cache_enable_mutex);

		static void __drain_swap_slots_cache(void);

		#define use_swap_slot_cache (swap_slot_cache_active && swap_slot_cache_enabled)

		static void deactivate_swap_slots_cache(void)
		{
		mutex_lock(&swap_slots_cache_mutex);
		swap_slot_cache_active = false;
		__drain_swap_slots_cache();
		mutex_unlock(&swap_slots_cache_mutex);
		}

		static void reactivate_swap_slots_cache(void)
		{
		mutex_lock(&swap_slots_cache_mutex);
		swap_slot_cache_active = true;
		mutex_unlock(&swap_slots_cache_mutex);
		}

		/* Must not be called with cpu hot plug lock */
		void disable_swap_slots_cache_lock(void)
		{
		mutex_lock(&swap_slots_cache_enable_mutex);
		swap_slot_cache_enabled = false;
		if (swap_slot_cache_initialized) {
		/* serialize with cpu hotplug operations */
		cpus_read_lock();
		__drain_swap_slots_cache();
		cpus_read_unlock();
		}
		}

		static void __reenable_swap_slots_cache(void)
		{
		swap_slot_cache_enabled = has_usable_swap();
		}

		void reenable_swap_slots_cache_unlock(void)
		{
		__reenable_swap_slots_cache();
		mutex_unlock(&swap_slots_cache_enable_mutex);
		}

		static bool check_cache_active(void)
		{
		long pages;

		if (!swap_slot_cache_enabled)
		return false;

		pages = get_nr_swap_pages();
		if (!swap_slot_cache_active) {
		if (pages > num_online_cpus() *
		THRESHOLD_ACTIVATE_SWAP_SLOTS_CACHE)
		reactivate_swap_slots_cache();
		goto out;
		}

		/* if global pool of slot caches too low, deactivate cache */
		if (pages < num_online_cpus() * THRESHOLD_DEACTIVATE_SWAP_SLOTS_CACHE)
		deactivate_swap_slots_cache();
		out:
		return swap_slot_cache_active;
		}

		static int alloc_swap_slot_cache(unsigned int cpu)
		{
		struct swap_slots_cache *cache;
		swp_entry_t *slots;

		/*
		* Do allocation outside swap_slots_cache_mutex
		* as kvzalloc could trigger reclaim and folio_alloc_swap,
		* which can lock swap_slots_cache_mutex.
		*/
		slots = kvcalloc(SWAP_SLOTS_CACHE_SIZE, sizeof(swp_entry_t),
		GFP_KERNEL);
		if (!slots)
		return -ENOMEM;

		mutex_lock(&swap_slots_cache_mutex);
		cache = &per_cpu(swp_slots, cpu);
		if (cache->slots) {
		/* cache already allocated */
		mutex_unlock(&swap_slots_cache_mutex);

		kvfree(slots);

		return 0;
		}

		if (!cache->lock_initialized) {
		mutex_init(&cache->alloc_lock);
		cache->lock_initialized = true;
		}
		cache->nr = 0;
		cache->cur = 0;
		cache->n_ret = 0;
		/*
		* We initialized alloc_lock and free_lock earlier. We use
		* !cache->slots or !cache->slots_ret to know if it is safe to acquire
		* the corresponding lock and use the cache. Memory barrier below
		* ensures the assumption.
		*/
		mb();
		cache->slots = slots;
		mutex_unlock(&swap_slots_cache_mutex);
		return 0;
		}

		static void drain_slots_cache_cpu(unsigned int cpu, bool free_slots)
		{
		struct swap_slots_cache *cache;

		cache = &per_cpu(swp_slots, cpu);
		if (cache->slots) {
		mutex_lock(&cache->alloc_lock);
		swapcache_free_entries(cache->slots + cache->cur, cache->nr);
		cache->cur = 0;
		cache->nr = 0;
		if (free_slots && cache->slots) {
		kvfree(cache->slots);
		cache->slots = NULL;
		}
		mutex_unlock(&cache->alloc_lock);
		}
		}

		static void __drain_swap_slots_cache(void)
		{
		unsigned int cpu;

		/*
		* This function is called during
		* 1) swapoff, when we have to make sure no
		* left over slots are in cache when we remove
		* a swap device;
		* 2) disabling of swap slot cache, when we run low
		* on swap slots when allocating memory and need
		* to return swap slots to global pool.
		*
		* We cannot acquire cpu hot plug lock here as
		* this function can be invoked in the cpu
		* hot plug path:
		* cpu_up -> lock cpu_hotplug -> cpu hotplug state callback
		* -> memory allocation -> direct reclaim -> folio_alloc_swap
		* -> drain_swap_slots_cache
		*
		* Hence the loop over current online cpu below could miss cpu that
		* is being brought online but not yet marked as online.
		* That is okay as we do not schedule and run anything on a
		* cpu before it has been marked online. Hence, we will not
		* fill any swap slots in slots cache of such cpu.
		* There are no slots on such cpu that need to be drained.
		*/
		for_each_online_cpu(cpu)
		drain_slots_cache_cpu(cpu, false);
		}

		static int free_slot_cache(unsigned int cpu)
		{
		mutex_lock(&swap_slots_cache_mutex);
		drain_slots_cache_cpu(cpu, true);
		mutex_unlock(&swap_slots_cache_mutex);
		return 0;
		}

		void enable_swap_slots_cache(void)
		{
		mutex_lock(&swap_slots_cache_enable_mutex);
		if (!swap_slot_cache_initialized) {
		int ret;

		ret = cpuhp_setup_state(CPUHP_AP_ONLINE_DYN, "swap_slots_cache",
		alloc_swap_slot_cache, free_slot_cache);
		if (WARN_ONCE(ret < 0, "Cache allocation failed (%s), operating "
		"without swap slots cache.\n", __func__))
		goto out_unlock;

		swap_slot_cache_initialized = true;
		}

		__reenable_swap_slots_cache();
		out_unlock:
		mutex_unlock(&swap_slots_cache_enable_mutex);
		}

		/* called with swap slot cache's alloc lock held */
		static int refill_swap_slots_cache(struct swap_slots_cache *cache)
		{
		if (!use_swap_slot_cache)
		return 0;

		cache->cur = 0;
		if (swap_slot_cache_active)
		cache->nr = get_swap_pages(SWAP_SLOTS_CACHE_SIZE,
		cache->slots, 0);

		return cache->nr;
		}

		swp_entry_t folio_alloc_swap(struct folio *folio)
		{
		swp_entry_t entry;
		struct swap_slots_cache *cache;

		entry.val = 0;

		if (folio_test_large(folio)) {
		if (IS_ENABLED(CONFIG_THP_SWAP))
		get_swap_pages(1, &entry, folio_order(folio));
		goto out;
		}

		/*
		* Preemption is allowed here, because we may sleep
		* in refill_swap_slots_cache(). But it is safe, because
		* accesses to the per-CPU data structure are protected by the
		* mutex cache->alloc_lock.
		*
		* The alloc path here does not touch cache->slots_ret
		* so cache->free_lock is not taken.
		*/
		cache = raw_cpu_ptr(&swp_slots);

		if (likely(check_cache_active() && cache->slots)) {
		mutex_lock(&cache->alloc_lock);
		if (cache->slots) {
		repeat:
		if (cache->nr) {
		entry = cache->slots[cache->cur];
		cache->slots[cache->cur++].val = 0;
		cache->nr--;
		} else if (refill_swap_slots_cache(cache)) {
		goto repeat;
		}
		}
		mutex_unlock(&cache->alloc_lock);
		if (entry.val)
		goto out;
		}

		get_swap_pages(1, &entry, 0);
		out:
		if (mem_cgroup_try_charge_swap(folio, entry)) {
		put_swap_folio(folio, entry);
		entry.val = 0;
		}
		return entry;
		}

mm/swap_state.c

+1 −7

Original line number	Diff line number	Diff line
		@@ -20,7 +20,6 @@
		#include <linux/blkdev.h>
		#include <linux/migrate.h>
		#include <linux/vmalloc.h>
		#include <linux/swap_slots.h>
		#include <linux/huge_mm.h>
		#include <linux/shmem_fs.h>
		#include "internal.h"
		@@ -447,13 +446,8 @@ struct folio *__read_swap_cache_async(swp_entry_t entry, gfp_t gfp_mask,

		/*
		* Just skip read ahead for unused swap slot.
		* During swap_off when swap_slot_cache is disabled,
		* we have to handle the race between putting
		* swap entry in swap cache and marking swap slot
		* as SWAP_HAS_CACHE. That's done in later part of code or
		* else swap_off will be aborted if we return NULL.
		*/
		if (!swap_entry_swapped(si, entry) && swap_slot_cache_enabled)
		if (!swap_entry_swapped(si, entry))
		goto put_and_return;

		/*