* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 10:40 ` [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods Baoquan He
@ 2026-03-02 11:11 ` Barry Song
2026-03-02 14:47 ` Baoquan He
2026-03-02 19:28 ` Chris Li
2026-03-02 12:20 ` YoungJun Park
` (3 subsequent siblings)
4 siblings, 2 replies; 18+ messages in thread
From: Barry Song @ 2026-03-02 11:11 UTC (permalink / raw)
To: Baoquan He
Cc: linux-mm, akpm, chrisl, kasong, shikemeng, nphamcs, youngjun.park
On Mon, Mar 2, 2026 at 6:40 PM Baoquan He <bhe@redhat.com> wrote:
>
> This simplifies codes and makes logic clearer. And also makes later any
> new swap device type being added easier to handle.
>
> Currently there are three types of swap devices: bdev_fs, bdev_sync
> and bdev_async, and only operations read_folio and write_folio are
> included. In the future, there could be more swap device types added
> and more appropriate opeations adapted into swap_ops.
>
> Signed-off-by: Baoquan He <bhe@redhat.com>
> ---
> include/linux/swap.h | 13 ++++++
> mm/swap.h | 1 -
> mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> mm/swapfile.c | 2 +
> mm/zswap.c | 3 +-
> 5 files changed, 76 insertions(+), 45 deletions(-)
>
> diff --git a/include/linux/swap.h b/include/linux/swap.h
> index 0effe3cc50f5..448e5e66ec5c 100644
> --- a/include/linux/swap.h
> +++ b/include/linux/swap.h
> @@ -19,6 +19,7 @@
> struct notifier_block;
>
> struct bio;
> +struct swap_iocb;
>
> struct pagevec;
>
> @@ -222,6 +223,17 @@ enum {
> #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
>
> +struct swap_ops {
> + void (*read_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> + void (*write_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> +};
> +
> +int probe_swap_fs(struct swap_info_struct *sis);
Does probe_swap_fs sound a bit odd?
What about init_swap_ops? Not sure if we have a better name.
Do we really want it, along with swap_ops, to live in
include/linux/swap.h? Could it be placed in mm/swap.h instead?
> +
> /*
> * The first page in the swap file is the swap header, which is always marked
> * bad to prevent it from being allocated as an entry. This also prevents the
> @@ -284,6 +296,7 @@ struct swap_info_struct {
> struct work_struct reclaim_work; /* reclaim worker */
> struct list_head discard_clusters; /* discard clusters list */
> struct plist_node avail_list; /* entry in swap_avail_head */
> + struct swap_ops *ops;
> };
>
> static inline swp_entry_t page_swap_entry(struct page *page)
> diff --git a/mm/swap.h b/mm/swap.h
> index 161185057993..c390df3f5889 100644
> --- a/mm/swap.h
> +++ b/mm/swap.h
> @@ -226,7 +226,6 @@ static inline void swap_read_unplug(struct swap_iocb *plug)
> }
> void swap_write_unplug(struct swap_iocb *sio);
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug);
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug);
>
> /* linux/mm/swap_state.c */
> extern struct address_space swap_space __read_mostly;
> diff --git a/mm/swap_io.c b/mm/swap_io.c
> index d1cdb10ba133..47077b345ae3 100644
> --- a/mm/swap_io.c
> +++ b/mm/swap_io.c
> @@ -240,6 +240,7 @@ static void swap_zeromap_folio_clear(struct folio *folio)
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> {
> int ret = 0;
> + struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
>
> if (folio_free_swap(folio))
> goto out_unlock;
> @@ -281,7 +282,8 @@ int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> return AOP_WRITEPAGE_ACTIVATE;
> }
>
> - __swap_writepage(folio, swap_plug);
> + if (sis->ops && sis->ops->write_folio)
> + sis->ops->write_folio(sis, folio, swap_plug);
Do we want a swap_write_folio() wrapper?
> return 0;
> out_unlock:
> folio_unlock(folio);
> @@ -371,10 +373,11 @@ static void sio_write_complete(struct kiocb *iocb, long ret)
> mempool_free(sio, sio_pool);
> }
>
> -static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> +static void swap_writepage_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **swap_plug)
> {
> struct swap_iocb *sio = swap_plug ? *swap_plug : NULL;
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct file *swap_file = sis->swap_file;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -407,8 +410,9 @@ static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> *swap_plug = sio;
> }
>
> -static void swap_writepage_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -427,8 +431,9 @@ static void swap_writepage_bdev_sync(struct folio *folio,
> __end_swap_bio_write(&bio);
> }
>
> -static void swap_writepage_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -444,29 +449,6 @@ static void swap_writepage_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug)
> -{
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> -
> - VM_BUG_ON_FOLIO(!folio_test_swapcache(folio), folio);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_FS_OPS, so the data_race
> - * is safe.
> - */
> - if (data_race(sis->flags & SWP_FS_OPS))
> - swap_writepage_fs(folio, swap_plug);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> - * is safe.
> - */
> - else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> - swap_writepage_bdev_sync(folio, sis);
> - else
> - swap_writepage_bdev_async(folio, sis);
> -}
> -
> void swap_write_unplug(struct swap_iocb *sio)
> {
> struct iov_iter from;
> @@ -535,9 +517,10 @@ static bool swap_read_folio_zeromap(struct folio *folio)
> return true;
> }
>
> -static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> +static void swap_read_folio_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct swap_iocb *sio = NULL;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -569,8 +552,9 @@ static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> *plug = sio;
> }
>
> -static void swap_read_folio_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -591,8 +575,9 @@ static void swap_read_folio_bdev_sync(struct folio *folio,
> put_task_struct(current);
> }
>
> -static void swap_read_folio_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -606,6 +591,42 @@ static void swap_read_folio_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> +static struct swap_ops bdev_fs_swap_ops = {
> + .read_folio = swap_read_folio_fs,
> + .write_folio = swap_writepage_fs,
> +};
const?
> +
> +static struct swap_ops bdev_sync_swap_ops = {
> + .read_folio = swap_read_folio_bdev_sync,
> + .write_folio = swap_writepage_bdev_sync,
> +};
const?
> +
> +static struct swap_ops bdev_async_swap_ops = {
> + .read_folio = swap_read_folio_bdev_async,
> + .write_folio = swap_writepage_bdev_async,
> +};
const?
> +
> +int probe_swap_fs(struct swap_info_struct *sis)
> +{
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_FS_OPS, so the data_race
> + * is safe.
> + */
> + if (data_race(sis->flags & SWP_FS_OPS))
> + sis->ops = &bdev_fs_swap_ops;
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> + * is safe.
> + */
> + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> + sis->ops = &bdev_sync_swap_ops;
> + else
> + sis->ops = &bdev_async_swap_ops;
> + return 0;
> +}
> +
> void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> {
> struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> @@ -640,13 +661,8 @@ void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> /* We have to read from slower devices. Increase zswap protection. */
> zswap_folio_swapin(folio);
>
> - if (data_race(sis->flags & SWP_FS_OPS)) {
> - swap_read_folio_fs(folio, plug);
> - } else if (synchronous) {
> - swap_read_folio_bdev_sync(folio, sis);
> - } else {
> - swap_read_folio_bdev_async(folio, sis);
> - }
> + if (sis->ops && sis->ops->read_folio)
> + sis->ops->read_folio(sis, folio, plug);
>
> finish:
> if (workingset) {
> diff --git a/mm/swapfile.c b/mm/swapfile.c
> index 915bc93964db..af498f9af328 100644
> --- a/mm/swapfile.c
> +++ b/mm/swapfile.c
> @@ -3625,6 +3625,8 @@ SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags)
> /* Sets SWP_WRITEOK, resurrect the percpu ref, expose the swap device */
> enable_swap_info(si);
>
> + probe_swap_fs(si);
Can we move this to enable_swap_info(), or perhaps even
deeper into setup_swap_info()?
> +
> pr_info("Adding %uk swap on %s. Priority:%d extents:%d across:%lluk %s%s%s%s\n",
> K(si->pages), name->name, si->prio, nr_extents,
> K((unsigned long long)span),
> diff --git a/mm/zswap.c b/mm/zswap.c
> index a399f7a10830..7ce906249c7a 100644
> --- a/mm/zswap.c
> +++ b/mm/zswap.c
> @@ -1055,7 +1055,8 @@ static int zswap_writeback_entry(struct zswap_entry *entry,
> folio_set_reclaim(folio);
>
> /* start writeback */
> - __swap_writepage(folio, NULL);
> + if (si->ops && si->ops->write_folio)
> + si->ops->write_folio(si, folio, NULL);
swap_write_folio() inline wrapper?
>
> out:
> if (ret && ret != -EEXIST) {
> --
> 2.52.0
>
Thanks
Barry
^ permalink raw reply [flat|nested] 18+ messages in thread* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 11:11 ` Barry Song
@ 2026-03-02 14:47 ` Baoquan He
2026-03-02 19:28 ` Chris Li
1 sibling, 0 replies; 18+ messages in thread
From: Baoquan He @ 2026-03-02 14:47 UTC (permalink / raw)
To: Barry Song
Cc: linux-mm, akpm, chrisl, kasong, shikemeng, nphamcs, youngjun.park
On 03/02/26 at 07:11pm, Barry Song wrote:
> On Mon, Mar 2, 2026 at 6:40 PM Baoquan He <bhe@redhat.com> wrote:
> >
> > This simplifies codes and makes logic clearer. And also makes later any
> > new swap device type being added easier to handle.
> >
> > Currently there are three types of swap devices: bdev_fs, bdev_sync
> > and bdev_async, and only operations read_folio and write_folio are
> > included. In the future, there could be more swap device types added
> > and more appropriate opeations adapted into swap_ops.
> >
> > Signed-off-by: Baoquan He <bhe@redhat.com>
> > ---
> > include/linux/swap.h | 13 ++++++
> > mm/swap.h | 1 -
> > mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> > mm/swapfile.c | 2 +
> > mm/zswap.c | 3 +-
> > 5 files changed, 76 insertions(+), 45 deletions(-)
> >
> > diff --git a/include/linux/swap.h b/include/linux/swap.h
> > index 0effe3cc50f5..448e5e66ec5c 100644
> > --- a/include/linux/swap.h
> > +++ b/include/linux/swap.h
> > @@ -19,6 +19,7 @@
> > struct notifier_block;
> >
> > struct bio;
> > +struct swap_iocb;
> >
> > struct pagevec;
> >
> > @@ -222,6 +223,17 @@ enum {
> > #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> > #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
> >
> > +struct swap_ops {
> > + void (*read_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > + void (*write_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > +};
> > +
> > +int probe_swap_fs(struct swap_info_struct *sis);
>
> Does probe_swap_fs sound a bit odd?
> What about init_swap_ops? Not sure if we have a better name.
Both is fine to me, if no other suggestion, I can take init_swap_ops()
instead.
>
> Do we really want it, along with swap_ops, to live in
> include/linux/swap.h? Could it be placed in mm/swap.h instead?
You are right, putting it into mm/swap.h sounds better.
>
> > +
> > /*
> > * The first page in the swap file is the swap header, which is always marked
> > * bad to prevent it from being allocated as an entry. This also prevents the
> > @@ -284,6 +296,7 @@ struct swap_info_struct {
> > struct work_struct reclaim_work; /* reclaim worker */
> > struct list_head discard_clusters; /* discard clusters list */
> > struct plist_node avail_list; /* entry in swap_avail_head */
> > + struct swap_ops *ops;
> > };
> >
> > static inline swp_entry_t page_swap_entry(struct page *page)
> > diff --git a/mm/swap.h b/mm/swap.h
> > index 161185057993..c390df3f5889 100644
> > --- a/mm/swap.h
> > +++ b/mm/swap.h
> > @@ -226,7 +226,6 @@ static inline void swap_read_unplug(struct swap_iocb *plug)
> > }
> > void swap_write_unplug(struct swap_iocb *sio);
> > int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug);
> > -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug);
> >
> > /* linux/mm/swap_state.c */
> > extern struct address_space swap_space __read_mostly;
> > diff --git a/mm/swap_io.c b/mm/swap_io.c
> > index d1cdb10ba133..47077b345ae3 100644
> > --- a/mm/swap_io.c
> > +++ b/mm/swap_io.c
> > @@ -240,6 +240,7 @@ static void swap_zeromap_folio_clear(struct folio *folio)
> > int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> > {
> > int ret = 0;
> > + struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> >
> > if (folio_free_swap(folio))
> > goto out_unlock;
> > @@ -281,7 +282,8 @@ int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> > return AOP_WRITEPAGE_ACTIVATE;
> > }
> >
> > - __swap_writepage(folio, swap_plug);
> > + if (sis->ops && sis->ops->write_folio)
> > + sis->ops->write_folio(sis, folio, swap_plug);
>
> Do we want a swap_write_folio() wrapper?
Seems swap_writeout() is the counterpart of swap_read_folio(). I
personally prefer to rename swap_writeout() to swap_write_folio(). And
make a wrapper as _swap_write_folio()?
>
> > return 0;
> > out_unlock:
> > folio_unlock(folio);
> > @@ -371,10 +373,11 @@ static void sio_write_complete(struct kiocb *iocb, long ret)
> > mempool_free(sio, sio_pool);
> > }
> >
> > -static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> > +static void swap_writepage_fs(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **swap_plug)
> > {
> > struct swap_iocb *sio = swap_plug ? *swap_plug : NULL;
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > struct file *swap_file = sis->swap_file;
> > loff_t pos = swap_dev_pos(folio->swap);
> >
> > @@ -407,8 +410,9 @@ static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> > *swap_plug = sio;
> > }
> >
> > -static void swap_writepage_bdev_sync(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_writepage_bdev_sync(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio_vec bv;
> > struct bio bio;
> > @@ -427,8 +431,9 @@ static void swap_writepage_bdev_sync(struct folio *folio,
> > __end_swap_bio_write(&bio);
> > }
> >
> > -static void swap_writepage_bdev_async(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_writepage_bdev_async(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio *bio;
> >
> > @@ -444,29 +449,6 @@ static void swap_writepage_bdev_async(struct folio *folio,
> > submit_bio(bio);
> > }
> >
> > -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug)
> > -{
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > -
> > - VM_BUG_ON_FOLIO(!folio_test_swapcache(folio), folio);
> > - /*
> > - * ->flags can be updated non-atomically (scan_swap_map_slots),
> > - * but that will never affect SWP_FS_OPS, so the data_race
> > - * is safe.
> > - */
> > - if (data_race(sis->flags & SWP_FS_OPS))
> > - swap_writepage_fs(folio, swap_plug);
> > - /*
> > - * ->flags can be updated non-atomically (scan_swap_map_slots),
> > - * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> > - * is safe.
> > - */
> > - else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> > - swap_writepage_bdev_sync(folio, sis);
> > - else
> > - swap_writepage_bdev_async(folio, sis);
> > -}
> > -
> > void swap_write_unplug(struct swap_iocb *sio)
> > {
> > struct iov_iter from;
> > @@ -535,9 +517,10 @@ static bool swap_read_folio_zeromap(struct folio *folio)
> > return true;
> > }
> >
> > -static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> > +static void swap_read_folio_fs(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > struct swap_iocb *sio = NULL;
> > loff_t pos = swap_dev_pos(folio->swap);
> >
> > @@ -569,8 +552,9 @@ static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> > *plug = sio;
> > }
> >
> > -static void swap_read_folio_bdev_sync(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_read_folio_bdev_sync(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio_vec bv;
> > struct bio bio;
> > @@ -591,8 +575,9 @@ static void swap_read_folio_bdev_sync(struct folio *folio,
> > put_task_struct(current);
> > }
> >
> > -static void swap_read_folio_bdev_async(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_read_folio_bdev_async(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio *bio;
> >
> > @@ -606,6 +591,42 @@ static void swap_read_folio_bdev_async(struct folio *folio,
> > submit_bio(bio);
> > }
> >
> > +static struct swap_ops bdev_fs_swap_ops = {
> > + .read_folio = swap_read_folio_fs,
> > + .write_folio = swap_writepage_fs,
> > +};
>
> const?
Right, will fix in v2.
>
> > +
> > +static struct swap_ops bdev_sync_swap_ops = {
> > + .read_folio = swap_read_folio_bdev_sync,
> > + .write_folio = swap_writepage_bdev_sync,
> > +};
>
> const?
>
> > +
> > +static struct swap_ops bdev_async_swap_ops = {
> > + .read_folio = swap_read_folio_bdev_async,
> > + .write_folio = swap_writepage_bdev_async,
> > +};
>
> const?
>
> > +
> > +int probe_swap_fs(struct swap_info_struct *sis)
> > +{
> > + /*
> > + * ->flags can be updated non-atomically (scan_swap_map_slots),
> > + * but that will never affect SWP_FS_OPS, so the data_race
> > + * is safe.
> > + */
> > + if (data_race(sis->flags & SWP_FS_OPS))
> > + sis->ops = &bdev_fs_swap_ops;
> > + /*
> > + * ->flags can be updated non-atomically (scan_swap_map_slots),
> > + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> > + * is safe.
> > + */
> > + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> > + sis->ops = &bdev_sync_swap_ops;
> > + else
> > + sis->ops = &bdev_async_swap_ops;
> > + return 0;
> > +}
> > +
> > void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> > {
> > struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > @@ -640,13 +661,8 @@ void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> > /* We have to read from slower devices. Increase zswap protection. */
> > zswap_folio_swapin(folio);
> >
> > - if (data_race(sis->flags & SWP_FS_OPS)) {
> > - swap_read_folio_fs(folio, plug);
> > - } else if (synchronous) {
> > - swap_read_folio_bdev_sync(folio, sis);
> > - } else {
> > - swap_read_folio_bdev_async(folio, sis);
> > - }
> > + if (sis->ops && sis->ops->read_folio)
> > + sis->ops->read_folio(sis, folio, plug);
> >
> > finish:
> > if (workingset) {
> > diff --git a/mm/swapfile.c b/mm/swapfile.c
> > index 915bc93964db..af498f9af328 100644
> > --- a/mm/swapfile.c
> > +++ b/mm/swapfile.c
> > @@ -3625,6 +3625,8 @@ SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags)
> > /* Sets SWP_WRITEOK, resurrect the percpu ref, expose the swap device */
> > enable_swap_info(si);
> >
> > + probe_swap_fs(si);
>
> Can we move this to enable_swap_info(), or perhaps even
> deeper into setup_swap_info()?
>
> > +
> > pr_info("Adding %uk swap on %s. Priority:%d extents:%d across:%lluk %s%s%s%s\n",
> > K(si->pages), name->name, si->prio, nr_extents,
> > K((unsigned long long)span),
> > diff --git a/mm/zswap.c b/mm/zswap.c
> > index a399f7a10830..7ce906249c7a 100644
> > --- a/mm/zswap.c
> > +++ b/mm/zswap.c
> > @@ -1055,7 +1055,8 @@ static int zswap_writeback_entry(struct zswap_entry *entry,
> > folio_set_reclaim(folio);
> >
> > /* start writeback */
> > - __swap_writepage(folio, NULL);
> > + if (si->ops && si->ops->write_folio)
> > + si->ops->write_folio(si, folio, NULL);
>
> swap_write_folio() inline wrapper?
Replied at above place. We will need a read_folio version too.
^ permalink raw reply [flat|nested] 18+ messages in thread* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 11:11 ` Barry Song
2026-03-02 14:47 ` Baoquan He
@ 2026-03-02 19:28 ` Chris Li
1 sibling, 0 replies; 18+ messages in thread
From: Chris Li @ 2026-03-02 19:28 UTC (permalink / raw)
To: Barry Song
Cc: Baoquan He, linux-mm, akpm, kasong, shikemeng, nphamcs, youngjun.park
On Mon, Mar 2, 2026 at 3:11 AM Barry Song <21cnbao@gmail.com> wrote:
>
> On Mon, Mar 2, 2026 at 6:40 PM Baoquan He <bhe@redhat.com> wrote:
> >
> > This simplifies codes and makes logic clearer. And also makes later any
> > new swap device type being added easier to handle.
> >
> > Currently there are three types of swap devices: bdev_fs, bdev_sync
> > and bdev_async, and only operations read_folio and write_folio are
> > included. In the future, there could be more swap device types added
> > and more appropriate opeations adapted into swap_ops.
> >
> > Signed-off-by: Baoquan He <bhe@redhat.com>
Thanks for sending this series out for discussion.
> > ---
> > include/linux/swap.h | 13 ++++++
> > mm/swap.h | 1 -
> > mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> > mm/swapfile.c | 2 +
> > mm/zswap.c | 3 +-
> > 5 files changed, 76 insertions(+), 45 deletions(-)
> >
> > diff --git a/include/linux/swap.h b/include/linux/swap.h
> > index 0effe3cc50f5..448e5e66ec5c 100644
> > --- a/include/linux/swap.h
> > +++ b/include/linux/swap.h
> > @@ -19,6 +19,7 @@
> > struct notifier_block;
> >
> > struct bio;
> > +struct swap_iocb;
> >
> > struct pagevec;
> >
> > @@ -222,6 +223,17 @@ enum {
> > #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> > #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
> >
> > +struct swap_ops {
> > + void (*read_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > + void (*write_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > +};
> > +
> > +int probe_swap_fs(struct swap_info_struct *sis);
>
> Does probe_swap_fs sound a bit odd?
> What about init_swap_ops? Not sure if we have a better name.
We can also call probe_swap_header(), which effectively detects which
implementation of the swap device operations the header requesting.
> Do we really want it, along with swap_ops, to live in
> include/linux/swap.h? Could it be placed in mm/swap.h instead?
That is a good point. The mm/swap.h is likely better (if possible)
for the swap_ops related declaration because all those ops are
internal swap behavior. We can move out later if there is a reason.
>
> > +
> > /*
> > * The first page in the swap file is the swap header, which is always marked
> > * bad to prevent it from being allocated as an entry. This also prevents the
> > @@ -284,6 +296,7 @@ struct swap_info_struct {
> > struct work_struct reclaim_work; /* reclaim worker */
> > struct list_head discard_clusters; /* discard clusters list */
> > struct plist_node avail_list; /* entry in swap_avail_head */
> > + struct swap_ops *ops;
> > };
> >
> > static inline swp_entry_t page_swap_entry(struct page *page)
> > diff --git a/mm/swap.h b/mm/swap.h
> > index 161185057993..c390df3f5889 100644
> > --- a/mm/swap.h
> > +++ b/mm/swap.h
> > @@ -226,7 +226,6 @@ static inline void swap_read_unplug(struct swap_iocb *plug)
> > }
> > void swap_write_unplug(struct swap_iocb *sio);
> > int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug);
> > -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug);
> >
> > /* linux/mm/swap_state.c */
> > extern struct address_space swap_space __read_mostly;
> > diff --git a/mm/swap_io.c b/mm/swap_io.c
> > index d1cdb10ba133..47077b345ae3 100644
> > --- a/mm/swap_io.c
> > +++ b/mm/swap_io.c
> > @@ -240,6 +240,7 @@ static void swap_zeromap_folio_clear(struct folio *folio)
> > int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> > {
> > int ret = 0;
> > + struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> >
> > if (folio_free_swap(folio))
> > goto out_unlock;
> > @@ -281,7 +282,8 @@ int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> > return AOP_WRITEPAGE_ACTIVATE;
> > }
> >
> > - __swap_writepage(folio, swap_plug);
> > + if (sis->ops && sis->ops->write_folio)
> > + sis->ops->write_folio(sis, folio, swap_plug);
>
> Do we want a swap_write_folio() wrapper?
I vote that it is better to keep these two lines as they are. No
wrapper is needed. Is that wrapper used in only two places? Also we
have too many swap_write_page/folio-like functions. Adding one doesn't
provide enough value, it is likely causing more energy to distingish
with the other similar functions.
> > return 0;
> > out_unlock:
> > folio_unlock(folio);
> > @@ -371,10 +373,11 @@ static void sio_write_complete(struct kiocb *iocb, long ret)
> > mempool_free(sio, sio_pool);
> > }
> >
> > -static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> > +static void swap_writepage_fs(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **swap_plug)
> > {
> > struct swap_iocb *sio = swap_plug ? *swap_plug : NULL;
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > struct file *swap_file = sis->swap_file;
> > loff_t pos = swap_dev_pos(folio->swap);
> >
> > @@ -407,8 +410,9 @@ static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> > *swap_plug = sio;
> > }
> >
> > -static void swap_writepage_bdev_sync(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_writepage_bdev_sync(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio_vec bv;
> > struct bio bio;
> > @@ -427,8 +431,9 @@ static void swap_writepage_bdev_sync(struct folio *folio,
> > __end_swap_bio_write(&bio);
> > }
> >
> > -static void swap_writepage_bdev_async(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_writepage_bdev_async(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio *bio;
> >
> > @@ -444,29 +449,6 @@ static void swap_writepage_bdev_async(struct folio *folio,
> > submit_bio(bio);
> > }
> >
> > -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug)
> > -{
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > -
> > - VM_BUG_ON_FOLIO(!folio_test_swapcache(folio), folio);
> > - /*
> > - * ->flags can be updated non-atomically (scan_swap_map_slots),
> > - * but that will never affect SWP_FS_OPS, so the data_race
> > - * is safe.
> > - */
> > - if (data_race(sis->flags & SWP_FS_OPS))
> > - swap_writepage_fs(folio, swap_plug);
> > - /*
> > - * ->flags can be updated non-atomically (scan_swap_map_slots),
> > - * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> > - * is safe.
> > - */
> > - else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> > - swap_writepage_bdev_sync(folio, sis);
> > - else
> > - swap_writepage_bdev_async(folio, sis);
> > -}
> > -
> > void swap_write_unplug(struct swap_iocb *sio)
> > {
> > struct iov_iter from;
> > @@ -535,9 +517,10 @@ static bool swap_read_folio_zeromap(struct folio *folio)
> > return true;
> > }
> >
> > -static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> > +static void swap_read_folio_fs(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > struct swap_iocb *sio = NULL;
> > loff_t pos = swap_dev_pos(folio->swap);
> >
> > @@ -569,8 +552,9 @@ static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> > *plug = sio;
> > }
> >
> > -static void swap_read_folio_bdev_sync(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_read_folio_bdev_sync(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio_vec bv;
> > struct bio bio;
> > @@ -591,8 +575,9 @@ static void swap_read_folio_bdev_sync(struct folio *folio,
> > put_task_struct(current);
> > }
> >
> > -static void swap_read_folio_bdev_async(struct folio *folio,
> > - struct swap_info_struct *sis)
> > +static void swap_read_folio_bdev_async(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug)
> > {
> > struct bio *bio;
> >
> > @@ -606,6 +591,42 @@ static void swap_read_folio_bdev_async(struct folio *folio,
> > submit_bio(bio);
> > }
> >
> > +static struct swap_ops bdev_fs_swap_ops = {
> > + .read_folio = swap_read_folio_fs,
> > + .write_folio = swap_writepage_fs,
> > +};
>
> const?
>
> > +
> > +static struct swap_ops bdev_sync_swap_ops = {
> > + .read_folio = swap_read_folio_bdev_sync,
> > + .write_folio = swap_writepage_bdev_sync,
> > +};
>
> const?
>
> > +
> > +static struct swap_ops bdev_async_swap_ops = {
> > + .read_folio = swap_read_folio_bdev_async,
> > + .write_folio = swap_writepage_bdev_async,
> > +};
>
> const?
>
> > +
> > +int probe_swap_fs(struct swap_info_struct *sis)
> > +{
> > + /*
> > + * ->flags can be updated non-atomically (scan_swap_map_slots),
> > + * but that will never affect SWP_FS_OPS, so the data_race
> > + * is safe.
> > + */
> > + if (data_race(sis->flags & SWP_FS_OPS))
> > + sis->ops = &bdev_fs_swap_ops;
> > + /*
> > + * ->flags can be updated non-atomically (scan_swap_map_slots),
> > + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> > + * is safe.
> > + */
> > + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> > + sis->ops = &bdev_sync_swap_ops;
> > + else
> > + sis->ops = &bdev_async_swap_ops;
> > + return 0;
> > +}
> > +
> > void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> > {
> > struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> > @@ -640,13 +661,8 @@ void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> > /* We have to read from slower devices. Increase zswap protection. */
> > zswap_folio_swapin(folio);
> >
> > - if (data_race(sis->flags & SWP_FS_OPS)) {
> > - swap_read_folio_fs(folio, plug);
> > - } else if (synchronous) {
> > - swap_read_folio_bdev_sync(folio, sis);
> > - } else {
> > - swap_read_folio_bdev_async(folio, sis);
> > - }
> > + if (sis->ops && sis->ops->read_folio)
> > + sis->ops->read_folio(sis, folio, plug);
> >
> > finish:
> > if (workingset) {
> > diff --git a/mm/swapfile.c b/mm/swapfile.c
> > index 915bc93964db..af498f9af328 100644
> > --- a/mm/swapfile.c
> > +++ b/mm/swapfile.c
> > @@ -3625,6 +3625,8 @@ SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags)
> > /* Sets SWP_WRITEOK, resurrect the percpu ref, expose the swap device */
> > enable_swap_info(si);
> >
> > + probe_swap_fs(si);
>
> Can we move this to enable_swap_info(), or perhaps even
> deeper into setup_swap_info()?
>
> > +
> > pr_info("Adding %uk swap on %s. Priority:%d extents:%d across:%lluk %s%s%s%s\n",
> > K(si->pages), name->name, si->prio, nr_extents,
> > K((unsigned long long)span),
> > diff --git a/mm/zswap.c b/mm/zswap.c
> > index a399f7a10830..7ce906249c7a 100644
> > --- a/mm/zswap.c
> > +++ b/mm/zswap.c
> > @@ -1055,7 +1055,8 @@ static int zswap_writeback_entry(struct zswap_entry *entry,
> > folio_set_reclaim(folio);
> >
> > /* start writeback */
> > - __swap_writepage(folio, NULL);
> > + if (si->ops && si->ops->write_folio)
> > + si->ops->write_folio(si, folio, NULL);
>
> swap_write_folio() inline wrapper?
Again, I think keeping it as is is fine.
Chris
^ permalink raw reply [flat|nested] 18+ messages in thread
* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 10:40 ` [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods Baoquan He
2026-03-02 11:11 ` Barry Song
@ 2026-03-02 12:20 ` YoungJun Park
2026-03-02 14:09 ` YoungJun Park
` (2 subsequent siblings)
4 siblings, 0 replies; 18+ messages in thread
From: YoungJun Park @ 2026-03-02 12:20 UTC (permalink / raw)
To: Baoquan He; +Cc: linux-mm, akpm, chrisl, kasong, shikemeng, nphamcs, baohua
On Mon, Mar 02, 2026 at 06:40:15PM +0800, Baoquan He wrote:
Hello Baoquan!
...
> + .read_folio = swap_read_folio_bdev_sync,
> + .write_folio = swap_writepage_bdev_sync,
> +};
> +
> +static struct swap_ops bdev_async_swap_ops = {
> + .read_folio = swap_read_folio_bdev_async,
> + .write_folio = swap_writepage_bdev_async,
> +};
> +
> +int probe_swap_fs(struct swap_info_struct *sis)
> +{
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_FS_OPS, so the data_race
> + * is safe.
> + */
> + if (data_race(sis->flags & SWP_FS_OPS))
> + sis->ops = &bdev_fs_swap_ops;
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> + * is safe.
> + */
The reference to scan_swap_map_slots appears to be outdated as the
function no longer exists in the current codebase. It might be
better to update this to a more generic term?
If comments are needed to be updated,
Similar comments in may_enter_fs likely need a similar update
for consistency.
> + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> + sis->ops = &bdev_sync_swap_ops;
> + else
> + sis->ops = &bdev_async_swap_ops;
> + return 0;
it seems return value is not needed.
Thanks
Youngjun Park
^ permalink raw reply [flat|nested] 18+ messages in thread* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 10:40 ` [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods Baoquan He
2026-03-02 11:11 ` Barry Song
2026-03-02 12:20 ` YoungJun Park
@ 2026-03-02 14:09 ` YoungJun Park
2026-03-02 19:35 ` Chris Li
2026-03-02 14:53 ` Usama Arif
2026-03-02 21:21 ` Nhat Pham
4 siblings, 1 reply; 18+ messages in thread
From: YoungJun Park @ 2026-03-02 14:09 UTC (permalink / raw)
To: Baoquan He; +Cc: linux-mm, akpm, chrisl, kasong, shikemeng, nphamcs, baohua
On Mon, Mar 02, 2026 at 06:40:15PM +0800, Baoquan He wrote:
> This simplifies codes and makes logic clearer. And also makes later any
> new swap device type being added easier to handle.
>
> Currently there are three types of swap devices: bdev_fs, bdev_sync
> and bdev_async, and only operations read_folio and write_folio are
> included. In the future, there could be more swap device types added
> and more appropriate opeations adapted into swap_ops.
>
> Signed-off-by: Baoquan He <bhe@redhat.com>
> ---
> include/linux/swap.h | 13 ++++++
> mm/swap.h | 1 -
> mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> mm/swapfile.c | 2 +
> mm/zswap.c | 3 +-
> 5 files changed, 76 insertions(+), 45 deletions(-)
>
> diff --git a/include/linux/swap.h b/include/linux/swap.h
> index 0effe3cc50f5..448e5e66ec5c 100644
> --- a/include/linux/swap.h
> +++ b/include/linux/swap.h
> @@ -19,6 +19,7 @@
> struct notifier_block;
>
> struct bio;
> +struct swap_iocb;
>
> struct pagevec;
>
> @@ -222,6 +223,17 @@ enum {
> #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
>
> +struct swap_ops {
> + void (*read_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> + void (*write_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> +};
I think swap_iocb is only required for fs-swap
(swap_folio_read_fs/swap_folio_write_fs).
If the goal is to support fs-swap through swap_ops, it might be worth
considering a more complete integration, including activate/deactivate
and swap_rw from aops, rather than only adding read/write hooks.
So.. we could keep SWP_FS_OPS as-is for now and just split
sync/async paths, and revisit a cleaner fs-swap integration later.
(I mean removing fs ops, and call swap_read/write_folio_fs on sync/async ops.)
How do you think?
Thanks
Youngjun Park
^ permalink raw reply [flat|nested] 18+ messages in thread* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 14:09 ` YoungJun Park
@ 2026-03-02 19:35 ` Chris Li
0 siblings, 0 replies; 18+ messages in thread
From: Chris Li @ 2026-03-02 19:35 UTC (permalink / raw)
To: YoungJun Park
Cc: Baoquan He, linux-mm, akpm, kasong, shikemeng, nphamcs, baohua
On Mon, Mar 2, 2026 at 6:10 AM YoungJun Park <youngjun.park@lge.com> wrote:
>
> On Mon, Mar 02, 2026 at 06:40:15PM +0800, Baoquan He wrote:
> > This simplifies codes and makes logic clearer. And also makes later any
> > new swap device type being added easier to handle.
> >
> > Currently there are three types of swap devices: bdev_fs, bdev_sync
> > and bdev_async, and only operations read_folio and write_folio are
> > included. In the future, there could be more swap device types added
> > and more appropriate opeations adapted into swap_ops.
> >
> > Signed-off-by: Baoquan He <bhe@redhat.com>
> > ---
> > include/linux/swap.h | 13 ++++++
> > mm/swap.h | 1 -
> > mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> > mm/swapfile.c | 2 +
> > mm/zswap.c | 3 +-
> > 5 files changed, 76 insertions(+), 45 deletions(-)
> >
> > diff --git a/include/linux/swap.h b/include/linux/swap.h
> > index 0effe3cc50f5..448e5e66ec5c 100644
> > --- a/include/linux/swap.h
> > +++ b/include/linux/swap.h
> > @@ -19,6 +19,7 @@
> > struct notifier_block;
> >
> > struct bio;
> > +struct swap_iocb;
> >
> > struct pagevec;
> >
> > @@ -222,6 +223,17 @@ enum {
> > #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> > #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
> >
> > +struct swap_ops {
> > + void (*read_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > + void (*write_folio)(struct swap_info_struct *sis,
> > + struct folio *folio,
> > + struct swap_iocb **plug);
> > +};
>
> I think swap_iocb is only required for fs-swap
> (swap_folio_read_fs/swap_folio_write_fs).
>
> If the goal is to support fs-swap through swap_ops, it might be worth
Consider this series as a starting point for discussion. Nothing is
set to stone.
> considering a more complete integration, including activate/deactivate
> and swap_rw from aops, rather than only adding read/write hooks.
Can be add as follow up patches to introduce active/deactive and
swap_rw from aops. In fact I want to see it as incremental patches
rather than add every possible swap_ops in one go. It is likely easier
to review as well.
>
> So.. we could keep SWP_FS_OPS as-is for now and just split
> sync/async paths, and revisit a cleaner fs-swap integration later.
> (I mean removing fs ops, and call swap_read/write_folio_fs on sync/async ops.)
You can propose incremental patches to add your additional swap ops
and into the series as the later iteration.
The sync/async split is just a MVP to introduce the first step of the swap_ops.
Chris
^ permalink raw reply [flat|nested] 18+ messages in thread
* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 10:40 ` [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods Baoquan He
` (2 preceding siblings ...)
2026-03-02 14:09 ` YoungJun Park
@ 2026-03-02 14:53 ` Usama Arif
2026-03-02 21:21 ` Nhat Pham
4 siblings, 0 replies; 18+ messages in thread
From: Usama Arif @ 2026-03-02 14:53 UTC (permalink / raw)
To: Baoquan He
Cc: Usama Arif, linux-mm, akpm, chrisl, kasong, shikemeng, nphamcs,
baohua, youngjun.park
On Mon, 2 Mar 2026 18:40:15 +0800 Baoquan He <bhe@redhat.com> wrote:
> This simplifies codes and makes logic clearer. And also makes later any
> new swap device type being added easier to handle.
>
> Currently there are three types of swap devices: bdev_fs, bdev_sync
> and bdev_async, and only operations read_folio and write_folio are
> included. In the future, there could be more swap device types added
> and more appropriate opeations adapted into swap_ops.
>
> Signed-off-by: Baoquan He <bhe@redhat.com>
> ---
> include/linux/swap.h | 13 ++++++
> mm/swap.h | 1 -
> mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> mm/swapfile.c | 2 +
> mm/zswap.c | 3 +-
> 5 files changed, 76 insertions(+), 45 deletions(-)
>
> diff --git a/include/linux/swap.h b/include/linux/swap.h
> index 0effe3cc50f5..448e5e66ec5c 100644
> --- a/include/linux/swap.h
> +++ b/include/linux/swap.h
> @@ -19,6 +19,7 @@
> struct notifier_block;
>
> struct bio;
> +struct swap_iocb;
>
> struct pagevec;
>
> @@ -222,6 +223,17 @@ enum {
> #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
>
> +struct swap_ops {
> + void (*read_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> + void (*write_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> +};
> +
> +int probe_swap_fs(struct swap_info_struct *sis);
> +
Would it be better to put these in mm/swap.h as they are only used in mm/?
> /*
> * The first page in the swap file is the swap header, which is always marked
> * bad to prevent it from being allocated as an entry. This also prevents the
> @@ -284,6 +296,7 @@ struct swap_info_struct {
> struct work_struct reclaim_work; /* reclaim worker */
> struct list_head discard_clusters; /* discard clusters list */
> struct plist_node avail_list; /* entry in swap_avail_head */
> + struct swap_ops *ops;
> };
>
> static inline swp_entry_t page_swap_entry(struct page *page)
> diff --git a/mm/swap.h b/mm/swap.h
> index 161185057993..c390df3f5889 100644
> --- a/mm/swap.h
> +++ b/mm/swap.h
> @@ -226,7 +226,6 @@ static inline void swap_read_unplug(struct swap_iocb *plug)
> }
> void swap_write_unplug(struct swap_iocb *sio);
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug);
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug);
>
> /* linux/mm/swap_state.c */
> extern struct address_space swap_space __read_mostly;
> diff --git a/mm/swap_io.c b/mm/swap_io.c
> index d1cdb10ba133..47077b345ae3 100644
> --- a/mm/swap_io.c
> +++ b/mm/swap_io.c
> @@ -240,6 +240,7 @@ static void swap_zeromap_folio_clear(struct folio *folio)
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> {
> int ret = 0;
> + struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
>
> if (folio_free_swap(folio))
> goto out_unlock;
> @@ -281,7 +282,8 @@ int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> return AOP_WRITEPAGE_ACTIVATE;
> }
>
> - __swap_writepage(folio, swap_plug);
> + if (sis->ops && sis->ops->write_folio)
> + sis->ops->write_folio(sis, folio, swap_plug);
The old __swap_writepage() always dispatched to one of the three write
functions unconditionally. If the guard condition is false (ops is NULL),
swap_writeout() returns 0 (success) but the folio is never unlocked --
the write functions are the ones that call folio_unlock(). Would this
leave the folio locked and lead to a deadlock? Similar issue in swap_read_folio.
> return 0;
> out_unlock:
> folio_unlock(folio);
> @@ -371,10 +373,11 @@ static void sio_write_complete(struct kiocb *iocb, long ret)
> mempool_free(sio, sio_pool);
> }
>
> -static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> +static void swap_writepage_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **swap_plug)
> {
> struct swap_iocb *sio = swap_plug ? *swap_plug : NULL;
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct file *swap_file = sis->swap_file;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -407,8 +410,9 @@ static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> *swap_plug = sio;
> }
>
> -static void swap_writepage_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -427,8 +431,9 @@ static void swap_writepage_bdev_sync(struct folio *folio,
> __end_swap_bio_write(&bio);
> }
>
> -static void swap_writepage_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -444,29 +449,6 @@ static void swap_writepage_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug)
> -{
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> -
> - VM_BUG_ON_FOLIO(!folio_test_swapcache(folio), folio);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_FS_OPS, so the data_race
> - * is safe.
> - */
> - if (data_race(sis->flags & SWP_FS_OPS))
> - swap_writepage_fs(folio, swap_plug);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> - * is safe.
> - */
> - else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> - swap_writepage_bdev_sync(folio, sis);
> - else
> - swap_writepage_bdev_async(folio, sis);
> -}
> -
> void swap_write_unplug(struct swap_iocb *sio)
> {
> struct iov_iter from;
> @@ -535,9 +517,10 @@ static bool swap_read_folio_zeromap(struct folio *folio)
> return true;
> }
>
> -static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> +static void swap_read_folio_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct swap_iocb *sio = NULL;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -569,8 +552,9 @@ static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> *plug = sio;
> }
>
> -static void swap_read_folio_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -591,8 +575,9 @@ static void swap_read_folio_bdev_sync(struct folio *folio,
> put_task_struct(current);
> }
>
> -static void swap_read_folio_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -606,6 +591,42 @@ static void swap_read_folio_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> +static struct swap_ops bdev_fs_swap_ops = {
> + .read_folio = swap_read_folio_fs,
> + .write_folio = swap_writepage_fs,
> +};
> +
> +static struct swap_ops bdev_sync_swap_ops = {
> + .read_folio = swap_read_folio_bdev_sync,
> + .write_folio = swap_writepage_bdev_sync,
> +};
> +
> +static struct swap_ops bdev_async_swap_ops = {
> + .read_folio = swap_read_folio_bdev_async,
> + .write_folio = swap_writepage_bdev_async,
> +};
> +
Should we have all of these as static const struct swap_ops?
> +int probe_swap_fs(struct swap_info_struct *sis)
> +{
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_FS_OPS, so the data_race
> + * is safe.
> + */
> + if (data_race(sis->flags & SWP_FS_OPS))
> + sis->ops = &bdev_fs_swap_ops;
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> + * is safe.
> + */
> + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> + sis->ops = &bdev_sync_swap_ops;
> + else
> + sis->ops = &bdev_async_swap_ops;
> + return 0;
The return is always 0, so this function could be void.
> +}
> +
> void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> {
> struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> @@ -640,13 +661,8 @@ void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> /* We have to read from slower devices. Increase zswap protection. */
> zswap_folio_swapin(folio);
>
> - if (data_race(sis->flags & SWP_FS_OPS)) {
> - swap_read_folio_fs(folio, plug);
> - } else if (synchronous) {
> - swap_read_folio_bdev_sync(folio, sis);
> - } else {
> - swap_read_folio_bdev_async(folio, sis);
> - }
> + if (sis->ops && sis->ops->read_folio)
> + sis->ops->read_folio(sis, folio, plug);
>
> finish:
> if (workingset) {
> diff --git a/mm/swapfile.c b/mm/swapfile.c
> index 915bc93964db..af498f9af328 100644
> --- a/mm/swapfile.c
> +++ b/mm/swapfile.c
> @@ -3625,6 +3625,8 @@ SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags)
> /* Sets SWP_WRITEOK, resurrect the percpu ref, expose the swap device */
> enable_swap_info(si);
>
> + probe_swap_fs(si);
> +
Should probe_swap_fs() be called before enable_swap_info() rather than
after it? enable_swap_info() sets SWP_WRITEOK and adds the device to
swap_active_head, making it available for allocation. At that point
si->ops is still NULL. If another CPU allocates swap from the new
device and reclaim writes to it before probe_swap_fs() runs, the
write will be silently dropped.
> pr_info("Adding %uk swap on %s. Priority:%d extents:%d across:%lluk %s%s%s%s\n",
> K(si->pages), name->name, si->prio, nr_extents,
> K((unsigned long long)span),
> diff --git a/mm/zswap.c b/mm/zswap.c
> index a399f7a10830..7ce906249c7a 100644
> --- a/mm/zswap.c
> +++ b/mm/zswap.c
> @@ -1055,7 +1055,8 @@ static int zswap_writeback_entry(struct zswap_entry *entry,
> folio_set_reclaim(folio);
>
> /* start writeback */
> - __swap_writepage(folio, NULL);
> + if (si->ops && si->ops->write_folio)
> + si->ops->write_folio(si, folio, NULL);
>
> out:
> if (ret && ret != -EEXIST) {
> --
> 2.52.0
^ permalink raw reply [flat|nested] 18+ messages in thread* Re: [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods
2026-03-02 10:40 ` [PATCH 2/3] mm/swap: use swap_ops to register swap device's methods Baoquan He
` (3 preceding siblings ...)
2026-03-02 14:53 ` Usama Arif
@ 2026-03-02 21:21 ` Nhat Pham
4 siblings, 0 replies; 18+ messages in thread
From: Nhat Pham @ 2026-03-02 21:21 UTC (permalink / raw)
To: Baoquan He
Cc: linux-mm, akpm, chrisl, kasong, shikemeng, baohua, youngjun.park
On Mon, Mar 2, 2026 at 2:40 AM Baoquan He <bhe@redhat.com> wrote:
>
> This simplifies codes and makes logic clearer. And also makes later any
> new swap device type being added easier to handle.
>
> Currently there are three types of swap devices: bdev_fs, bdev_sync
> and bdev_async, and only operations read_folio and write_folio are
> included. In the future, there could be more swap device types added
> and more appropriate opeations adapted into swap_ops.
>
> Signed-off-by: Baoquan He <bhe@redhat.com>
> ---
> include/linux/swap.h | 13 ++++++
> mm/swap.h | 1 -
> mm/swap_io.c | 102 +++++++++++++++++++++++++------------------
> mm/swapfile.c | 2 +
> mm/zswap.c | 3 +-
> 5 files changed, 76 insertions(+), 45 deletions(-)
>
> diff --git a/include/linux/swap.h b/include/linux/swap.h
> index 0effe3cc50f5..448e5e66ec5c 100644
> --- a/include/linux/swap.h
> +++ b/include/linux/swap.h
> @@ -19,6 +19,7 @@
> struct notifier_block;
>
> struct bio;
> +struct swap_iocb;
>
> struct pagevec;
>
> @@ -222,6 +223,17 @@ enum {
> #define SWAP_CLUSTER_MAX_SKIPPED (SWAP_CLUSTER_MAX << 10)
> #define COMPACT_CLUSTER_MAX SWAP_CLUSTER_MAX
>
> +struct swap_ops {
> + void (*read_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> + void (*write_folio)(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug);
> +};
> +
> +int probe_swap_fs(struct swap_info_struct *sis);
> +
> /*
> * The first page in the swap file is the swap header, which is always marked
> * bad to prevent it from being allocated as an entry. This also prevents the
> @@ -284,6 +296,7 @@ struct swap_info_struct {
> struct work_struct reclaim_work; /* reclaim worker */
> struct list_head discard_clusters; /* discard clusters list */
> struct plist_node avail_list; /* entry in swap_avail_head */
> + struct swap_ops *ops;
> };
>
> static inline swp_entry_t page_swap_entry(struct page *page)
> diff --git a/mm/swap.h b/mm/swap.h
> index 161185057993..c390df3f5889 100644
> --- a/mm/swap.h
> +++ b/mm/swap.h
> @@ -226,7 +226,6 @@ static inline void swap_read_unplug(struct swap_iocb *plug)
> }
> void swap_write_unplug(struct swap_iocb *sio);
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug);
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug);
>
> /* linux/mm/swap_state.c */
> extern struct address_space swap_space __read_mostly;
> diff --git a/mm/swap_io.c b/mm/swap_io.c
> index d1cdb10ba133..47077b345ae3 100644
> --- a/mm/swap_io.c
> +++ b/mm/swap_io.c
> @@ -240,6 +240,7 @@ static void swap_zeromap_folio_clear(struct folio *folio)
> int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> {
> int ret = 0;
> + struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
>
> if (folio_free_swap(folio))
> goto out_unlock;
> @@ -281,7 +282,8 @@ int swap_writeout(struct folio *folio, struct swap_iocb **swap_plug)
> return AOP_WRITEPAGE_ACTIVATE;
> }
>
> - __swap_writepage(folio, swap_plug);
> + if (sis->ops && sis->ops->write_folio)
> + sis->ops->write_folio(sis, folio, swap_plug);
> return 0;
> out_unlock:
> folio_unlock(folio);
> @@ -371,10 +373,11 @@ static void sio_write_complete(struct kiocb *iocb, long ret)
> mempool_free(sio, sio_pool);
> }
>
> -static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> +static void swap_writepage_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **swap_plug)
> {
> struct swap_iocb *sio = swap_plug ? *swap_plug : NULL;
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct file *swap_file = sis->swap_file;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -407,8 +410,9 @@ static void swap_writepage_fs(struct folio *folio, struct swap_iocb **swap_plug)
> *swap_plug = sio;
> }
>
> -static void swap_writepage_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -427,8 +431,9 @@ static void swap_writepage_bdev_sync(struct folio *folio,
> __end_swap_bio_write(&bio);
> }
>
> -static void swap_writepage_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_writepage_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -444,29 +449,6 @@ static void swap_writepage_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> -void __swap_writepage(struct folio *folio, struct swap_iocb **swap_plug)
> -{
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> -
> - VM_BUG_ON_FOLIO(!folio_test_swapcache(folio), folio);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_FS_OPS, so the data_race
> - * is safe.
> - */
> - if (data_race(sis->flags & SWP_FS_OPS))
> - swap_writepage_fs(folio, swap_plug);
> - /*
> - * ->flags can be updated non-atomically (scan_swap_map_slots),
> - * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> - * is safe.
> - */
> - else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> - swap_writepage_bdev_sync(folio, sis);
> - else
> - swap_writepage_bdev_async(folio, sis);
> -}
> -
> void swap_write_unplug(struct swap_iocb *sio)
> {
> struct iov_iter from;
> @@ -535,9 +517,10 @@ static bool swap_read_folio_zeromap(struct folio *folio)
> return true;
> }
>
> -static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> +static void swap_read_folio_fs(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> - struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> struct swap_iocb *sio = NULL;
> loff_t pos = swap_dev_pos(folio->swap);
>
> @@ -569,8 +552,9 @@ static void swap_read_folio_fs(struct folio *folio, struct swap_iocb **plug)
> *plug = sio;
> }
>
> -static void swap_read_folio_bdev_sync(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_sync(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio_vec bv;
> struct bio bio;
> @@ -591,8 +575,9 @@ static void swap_read_folio_bdev_sync(struct folio *folio,
> put_task_struct(current);
> }
>
> -static void swap_read_folio_bdev_async(struct folio *folio,
> - struct swap_info_struct *sis)
> +static void swap_read_folio_bdev_async(struct swap_info_struct *sis,
> + struct folio *folio,
> + struct swap_iocb **plug)
> {
> struct bio *bio;
>
> @@ -606,6 +591,42 @@ static void swap_read_folio_bdev_async(struct folio *folio,
> submit_bio(bio);
> }
>
> +static struct swap_ops bdev_fs_swap_ops = {
> + .read_folio = swap_read_folio_fs,
> + .write_folio = swap_writepage_fs,
> +};
> +
> +static struct swap_ops bdev_sync_swap_ops = {
> + .read_folio = swap_read_folio_bdev_sync,
> + .write_folio = swap_writepage_bdev_sync,
> +};
> +
> +static struct swap_ops bdev_async_swap_ops = {
> + .read_folio = swap_read_folio_bdev_async,
> + .write_folio = swap_writepage_bdev_async,
> +};
> +
> +int probe_swap_fs(struct swap_info_struct *sis)
> +{
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_FS_OPS, so the data_race
> + * is safe.
> + */
> + if (data_race(sis->flags & SWP_FS_OPS))
> + sis->ops = &bdev_fs_swap_ops;
> + /*
> + * ->flags can be updated non-atomically (scan_swap_map_slots),
> + * but that will never affect SWP_SYNCHRONOUS_IO, so the data_race
> + * is safe.
> + */
> + else if (data_race(sis->flags & SWP_SYNCHRONOUS_IO))
> + sis->ops = &bdev_sync_swap_ops;
> + else
> + sis->ops = &bdev_async_swap_ops;
> + return 0;
> +}
> +
> void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> {
> struct swap_info_struct *sis = __swap_entry_to_info(folio->swap);
> @@ -640,13 +661,8 @@ void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
> /* We have to read from slower devices. Increase zswap protection. */
> zswap_folio_swapin(folio);
>
> - if (data_race(sis->flags & SWP_FS_OPS)) {
> - swap_read_folio_fs(folio, plug);
> - } else if (synchronous) {
> - swap_read_folio_bdev_sync(folio, sis);
> - } else {
> - swap_read_folio_bdev_async(folio, sis);
> - }
> + if (sis->ops && sis->ops->read_folio)
> + sis->ops->read_folio(sis, folio, plug);
>
> finish:
> if (workingset) {
> diff --git a/mm/swapfile.c b/mm/swapfile.c
> index 915bc93964db..af498f9af328 100644
> --- a/mm/swapfile.c
> +++ b/mm/swapfile.c
> @@ -3625,6 +3625,8 @@ SYSCALL_DEFINE2(swapon, const char __user *, specialfile, int, swap_flags)
> /* Sets SWP_WRITEOK, resurrect the percpu ref, expose the swap device */
> enable_swap_info(si);
>
> + probe_swap_fs(si);
> +
> pr_info("Adding %uk swap on %s. Priority:%d extents:%d across:%lluk %s%s%s%s\n",
> K(si->pages), name->name, si->prio, nr_extents,
> K((unsigned long long)span),
> diff --git a/mm/zswap.c b/mm/zswap.c
> index a399f7a10830..7ce906249c7a 100644
> --- a/mm/zswap.c
> +++ b/mm/zswap.c
> @@ -1055,7 +1055,8 @@ static int zswap_writeback_entry(struct zswap_entry *entry,
> folio_set_reclaim(folio);
>
> /* start writeback */
> - __swap_writepage(folio, NULL);
> + if (si->ops && si->ops->write_folio)
> + si->ops->write_folio(si, folio, NULL);
This one seems really weird to me TBH...
What's the point of a zswap writeback to a backend without writeback
operation...? We're loading the coldest zswap objects back into
memory...?
More generally, do you anticipate a swap backend with no write_folio?
I can't imagine such backend.
That said, if they exist, they should be exempted from zswap
writeback. At the very least, move this check to the beginning of
zswap_writeback_entry(), right after swap device pinning
(get_swap_device()):
1. If swap device has no writeback op, just bail. Don't even bother
allocate swap cache, decompression, etc.
2. If you anticipate that this case will never happen, add a warn.
^ permalink raw reply [flat|nested] 18+ messages in thread