release 6.15.4
debian/bin/genpatch-pf (vendored, 2 lines changed)
@@ -7,7 +7,7 @@ w=$(git rev-parse --path-format=absolute --show-toplevel) ; : "${w:?}" ; cd "$w"
 
 dst='debian/patches/tmp-pf'
 src='../linux-extras'
-branches='fixes archlinux cpuidle kbuild nfs smb xfs'
+branches='fixes archlinux cpuidle exfat kbuild nfs smb xfs'
 
 if [ -d "${dst}" ] ; then rm -rf "${dst}" ; fi
 mkdir -p "${dst}"
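The change above adds the `exfat` topic branch to the set of patch sources. For context, here is a minimal sketch of how a branches list like this is typically consumed to regenerate the tmp-pf patch queue; the loop body is an assumption for illustration, not the actual genpatch-pf logic:

```sh
#!/bin/sh
# Illustrative sketch only: export each topic branch from the tree in ${src}
# as a numbered patch series under ${dst}. The ref layout (merge base against
# the local master branch) is an assumption.
dst='debian/patches/tmp-pf'
src='../linux-extras'
branches='fixes archlinux cpuidle exfat kbuild nfs smb xfs'

mkdir -p "${dst}"
for b in ${branches} ; do
    base=$(git -C "${src}" merge-base master "${b}")
    git -C "${src}" format-patch --output-directory "${PWD}/${dst}/${b}" \
        "${base}..${b}"
done
```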
debian/changelog (vendored, 7 lines changed)
@@ -1,3 +1,10 @@
+linux (6.15.4-1) sid; urgency=medium
+
+  * New upstream stable update:
+    https://www.kernel.org/pub/linux/kernel/v6.x/ChangeLog-6.15.4
+
+ -- Konstantin Demin <rockdrilla@gmail.com>  Fri, 27 Jun 2025 14:05:47 +0300
+
 linux (6.15.3-1) sid; urgency=medium
 
   * New upstream stable update:
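The referenced upstream changelog can be skimmed directly when reviewing what the 6.15.4 stable bump pulls in; a small convenience one-liner (curl is assumed, any HTTP client works):

```sh
# Skim the upstream 6.15.4 stable changelog referenced in the entry above.
curl -s https://www.kernel.org/pub/linux/kernel/v6.x/ChangeLog-6.15.4 | head -n 40
```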
@@ -36,7 +36,7 @@ Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
 
 --- a/kernel/events/core.c
 +++ b/kernel/events/core.c
-@@ -450,8 +450,13 @@ static struct kmem_cache *perf_event_cac
+@@ -463,8 +463,13 @@ static struct kmem_cache *perf_event_cac
   * 0 - disallow raw tracepoint access for unpriv
   * 1 - disallow cpu events for unpriv
   * 2 - disallow kernel profiling for unpriv
@@ -50,7 +50,7 @@ Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
 
  /* Minimum for 512 kiB + 1 user control page. 'free' kiB per user. */
  static int sysctl_perf_event_mlock __read_mostly = 512 + (PAGE_SIZE / 1024);
-@@ -13110,6 +13115,9 @@ SYSCALL_DEFINE5(perf_event_open,
+@@ -13144,6 +13149,9 @@ SYSCALL_DEFINE5(perf_event_open,
 	if (err)
 		return err;
 
@@ -68,7 +68,7 @@ Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
 	} else if (!strncmp(str, "forcedac", 8)) {
 		pr_warn("intel_iommu=forcedac deprecated; use iommu.forcedac instead\n");
 		iommu_dma_forcedac = true;
-@@ -1935,6 +1943,9 @@ static int device_def_domain_type(struct
+@@ -1936,6 +1944,9 @@ static int device_def_domain_type(struct
 
 	if ((iommu_identity_mapping & IDENTMAP_AZALIA) && IS_AZALIA(pdev))
 		return IOMMU_DOMAIN_IDENTITY;
@@ -78,7 +78,7 @@ Signed-off-by: Ben Hutchings <ben@decadent.org.uk>
 	}
 
 	return 0;
-@@ -2229,6 +2240,9 @@ static int __init init_dmars(void)
+@@ -2230,6 +2241,9 @@ static int __init init_dmars(void)
 		iommu_set_root_entry(iommu);
 	}
 
@@ -18,7 +18,7 @@ Signed-off-by: David Bauer <mail@david-bauer.net>
 
 --- a/net/mac80211/sta_info.c
 +++ b/net/mac80211/sta_info.c
-@@ -2474,6 +2474,13 @@ static void sta_stats_decode_rate(struct
+@@ -2467,6 +2467,13 @@ static void sta_stats_decode_rate(struct
 
 	sband = local->hw.wiphy->bands[band];
 
@@ -28,7 +28,7 @@ Signed-off-by: Johannes Berg <johannes.berg@intel.com>
 
 --- a/net/mac80211/sta_info.c
 +++ b/net/mac80211/sta_info.c
-@@ -583,6 +583,7 @@ __sta_info_alloc(struct ieee80211_sub_if
+@@ -582,6 +582,7 @@ __sta_info_alloc(struct ieee80211_sub_if
 	spin_lock_init(&sta->ps_lock);
 	INIT_WORK(&sta->drv_deliver_wk, sta_deliver_ps_frames);
 	wiphy_work_init(&sta->ampdu_mlme.work, ieee80211_ba_session_work);
@@ -23,7 +23,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 
 --- a/net/mac80211/tx.c
 +++ b/net/mac80211/tx.c
-@@ -4084,7 +4084,7 @@ struct ieee80211_txq *ieee80211_next_txq
+@@ -4077,7 +4077,7 @@ struct ieee80211_txq *ieee80211_next_txq
 
 		if (deficit < 0)
 			sta->airtime[txqi->txq.ac].deficit +=
@@ -32,7 +32,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 
 		if (deficit < 0 || !aql_check) {
 			list_move_tail(&txqi->schedule_order,
-@@ -4227,7 +4227,8 @@ bool ieee80211_txq_may_transmit(struct i
+@@ -4220,7 +4220,8 @@ bool ieee80211_txq_may_transmit(struct i
 	}
 	sta = container_of(iter->txq.sta, struct sta_info, sta);
 	if (ieee80211_sta_deficit(sta, ac) < 0)
@@ -42,7 +42,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 		list_move_tail(&iter->schedule_order, &local->active_txqs[ac]);
 	}
 
-@@ -4235,7 +4236,7 @@ bool ieee80211_txq_may_transmit(struct i
+@@ -4228,7 +4229,7 @@ bool ieee80211_txq_may_transmit(struct i
 	if (sta->airtime[ac].deficit >= 0)
 		goto out;
 
@@ -95,7 +95,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 		spin_lock_init(&local->active_txq_lock[i]);
 --- a/net/mac80211/sta_info.c
 +++ b/net/mac80211/sta_info.c
-@@ -2388,13 +2388,28 @@ EXPORT_SYMBOL(ieee80211_sta_recalc_aggre
+@@ -2381,13 +2381,28 @@ EXPORT_SYMBOL(ieee80211_sta_recalc_aggre
 
 void ieee80211_sta_update_pending_airtime(struct ieee80211_local *local,
 					  struct sta_info *sta, u8 ac,
@@ -127,7 +127,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 		atomic_add(tx_airtime,
 --- a/net/mac80211/tx.c
 +++ b/net/mac80211/tx.c
-@@ -2556,7 +2556,7 @@ static u16 ieee80211_store_ack_skb(struc
+@@ -2549,7 +2549,7 @@ static u16 ieee80211_store_ack_skb(struc
 
 	spin_lock_irqsave(&local->ack_status_lock, flags);
 	id = idr_alloc(&local->ack_status_frames, ack_skb,
@@ -136,7 +136,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 	spin_unlock_irqrestore(&local->ack_status_lock, flags);
 
 	if (id >= 0) {
-@@ -3985,20 +3985,20 @@ begin:
+@@ -3978,20 +3978,20 @@ begin:
 encap_out:
 	info->control.vif = vif;
 
@@ -167,7 +167,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 	}
 
 	return skb;
-@@ -4050,6 +4050,7 @@ struct ieee80211_txq *ieee80211_next_txq
+@@ -4043,6 +4043,7 @@ struct ieee80211_txq *ieee80211_next_txq
 	struct ieee80211_txq *ret = NULL;
 	struct txq_info *txqi = NULL, *head = NULL;
 	bool found_eligible_txq = false;
@@ -175,7 +175,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 
 	spin_lock_bh(&local->active_txq_lock[ac]);
 
-@@ -4073,26 +4074,26 @@ struct ieee80211_txq *ieee80211_next_txq
+@@ -4066,26 +4067,26 @@ struct ieee80211_txq *ieee80211_next_txq
 	if (!head)
 		head = txqi;
 
@@ -214,7 +214,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 	if (txqi->schedule_round == local->schedule_round[ac])
 		goto out;
 
-@@ -4157,7 +4158,8 @@ bool ieee80211_txq_airtime_check(struct
+@@ -4150,7 +4151,8 @@ bool ieee80211_txq_airtime_check(struct
 	return true;
 
 	if (!txq->sta)
@@ -224,7 +224,7 @@ Signed-off-by: Felix Fietkau <nbd@nbd.name>
 
 	if (unlikely(txq->tid == IEEE80211_NUM_TIDS))
 		return true;
-@@ -4206,15 +4208,15 @@ bool ieee80211_txq_may_transmit(struct i
+@@ -4199,15 +4201,15 @@ bool ieee80211_txq_may_transmit(struct i
 
 	spin_lock_bh(&local->active_txq_lock[ac]);
 
@@ -1,221 +0,0 @@
This reverts commit 484a54c2e597dbc4ace79c1687022282905afba0. The CoDel
parameter change essentially disables CoDel on slow stations, with some
questionable assumptions, as Dave pointed out in [0]. Quoting from
there:

But here are my pithy comments as to why this part of mac80211 is so
wrong...

static void sta_update_codel_params(struct sta_info *sta, u32 thr)
{
-       if (thr && thr < STA_SLOW_THRESHOLD * sta->local->num_sta) {

1) sta->local->num_sta is the number of associated, rather than
active, stations. "Active" stations in the last 50ms or so, might have
been a better thing to use, but as most people have far more than that
associated, we end up with really lousy codel parameters, all the
time. Mistake numero uno!

2) The STA_SLOW_THRESHOLD was completely arbitrary in 2016.

-               sta->cparams.target = MS2TIME(50);

This, by itself, was probably not too bad. 30ms might have been
better, at the time, when we were battling powersave etc, but 20ms was
enough, really, to cover most scenarios, even where we had low rate
2Ghz multicast to cope with. Even then, codel has a hard time finding
any sane drop rate at all, with a target this high.

-               sta->cparams.interval = MS2TIME(300);

But this was horrible, a total mistake, that is leading to codel being
completely ineffective in almost any scenario on clients or APS.
100ms, even 80ms, here, would be vastly better than this insanity. I'm
seeing 5+seconds of delay accumulated in a bunch of otherwise happily
fq-ing APs....

100ms of observed jitter during a flow is enough. Certainly (in 2016)
there were interactions with powersave that I did not understand, and
still don't, but if you are transmitting in the first place, powersave
shouldn't be a problemmmm.....

-               sta->cparams.ecn = false;

At the time we were pretty nervous about ecn, I'm kind of sanguine
about it now, and reliably indicating ecn seems better than turning it
off for any reason.

[...]

In production, on p2p wireless, I've had 8ms and 80ms for target and
interval for years now, and it works great.

I think Dave's arguments above are basically sound on the face of it,
and various experimentation with tighter CoDel parameters in the OpenWrt
community have show promising results[1]. So I don't think there's any
reason to keep this parameter fiddling; hence this revert.

[0] https://lore.kernel.org/linux-wireless/CAA93jw6NJ2cmLmMauz0xAgC2MGbBq6n0ZiZzAdkK0u4b+O2yXg@mail.gmail.com/
[1] https://forum.openwrt.org/t/reducing-multiplexing-latencies-still-further-in-wifi/133605/130

Suggested-By: Dave Taht <dave.taht@gmail.com>
In-memory-of: Dave Taht <dave.taht@gmail.com>
Signed-off-by: Toke Høiland-Jørgensen <toke@toke.dk>

--- a/include/net/mac80211.h
+++ b/include/net/mac80211.h
@@ -5347,22 +5347,6 @@ void ieee80211_get_tx_rates(struct ieee8
 			    int max_rates);
 
 /**
- * ieee80211_sta_set_expected_throughput - set the expected tpt for a station
- *
- * Call this function to notify mac80211 about a change in expected throughput
- * to a station. A driver for a device that does rate control in firmware can
- * call this function when the expected throughput estimate towards a station
- * changes. The information is used to tune the CoDel AQM applied to traffic
- * going towards that station (which can otherwise be too aggressive and cause
- * slow stations to starve).
- *
- * @pubsta: the station to set throughput for.
- * @thr: the current expected throughput in kbps.
- */
-void ieee80211_sta_set_expected_throughput(struct ieee80211_sta *pubsta,
-					   u32 thr);
-
-/**
  * ieee80211_tx_rate_update - transmit rate update callback
  *
  * Drivers should call this functions with a non-NULL pub sta
--- a/net/mac80211/debugfs_sta.c
+++ b/net/mac80211/debugfs_sta.c
@@ -152,12 +152,6 @@ static ssize_t sta_aqm_read(struct file
 
 	p += scnprintf(p,
 		       bufsz + buf - p,
-		       "target %uus interval %uus ecn %s\n",
-		       codel_time_to_us(sta->cparams.target),
-		       codel_time_to_us(sta->cparams.interval),
-		       sta->cparams.ecn ? "yes" : "no");
-	p += scnprintf(p,
-		       bufsz + buf - p,
 		       "tid ac backlog-bytes backlog-packets new-flows drops marks overlimit collisions tx-bytes tx-packets flags\n");
 
 	for (i = 0; i < ARRAY_SIZE(sta->sta.txq); i++) {
--- a/net/mac80211/rate.c
+++ b/net/mac80211/rate.c
@@ -990,8 +990,6 @@ int rate_control_set_rates(struct ieee80
 	if (sta->uploaded)
 		drv_sta_rate_tbl_update(hw_to_local(hw), sta->sdata, pubsta);
 
-	ieee80211_sta_set_expected_throughput(pubsta, sta_get_expected_throughput(sta));
-
 	return 0;
 }
 EXPORT_SYMBOL(rate_control_set_rates);
--- a/net/mac80211/sta_info.c
+++ b/net/mac80211/sta_info.c
@@ -18,7 +18,6 @@
 #include <linux/timer.h>
 #include <linux/rtnetlink.h>
 
-#include <net/codel.h>
 #include <net/mac80211.h>
 #include "ieee80211_i.h"
 #include "driver-ops.h"
@@ -702,13 +701,6 @@ __sta_info_alloc(struct ieee80211_sub_if
 		}
 	}
 
-	sta->cparams.ce_threshold = CODEL_DISABLED_THRESHOLD;
-	sta->cparams.target = MS2TIME(20);
-	sta->cparams.interval = MS2TIME(100);
-	sta->cparams.ecn = true;
-	sta->cparams.ce_threshold_selector = 0;
-	sta->cparams.ce_threshold_mask = 0;
-
 	sta_dbg(sdata, "Allocated STA %pM\n", sta->sta.addr);
 
 	return sta;
@@ -2928,27 +2920,6 @@ unsigned long ieee80211_sta_last_active(
 	return sta->deflink.status_stats.last_ack;
 }
 
-static void sta_update_codel_params(struct sta_info *sta, u32 thr)
-{
-	if (thr && thr < STA_SLOW_THRESHOLD * sta->local->num_sta) {
-		sta->cparams.target = MS2TIME(50);
-		sta->cparams.interval = MS2TIME(300);
-		sta->cparams.ecn = false;
-	} else {
-		sta->cparams.target = MS2TIME(20);
-		sta->cparams.interval = MS2TIME(100);
-		sta->cparams.ecn = true;
-	}
-}
-
-void ieee80211_sta_set_expected_throughput(struct ieee80211_sta *pubsta,
-					   u32 thr)
-{
-	struct sta_info *sta = container_of(pubsta, struct sta_info, sta);
-
-	sta_update_codel_params(sta, thr);
-}
-
 int ieee80211_sta_allocate_link(struct sta_info *sta, unsigned int link_id)
 {
 	struct ieee80211_sub_if_data *sdata = sta->sdata;
--- a/net/mac80211/sta_info.h
+++ b/net/mac80211/sta_info.h
@@ -467,14 +467,6 @@ struct ieee80211_fragment_cache {
 	unsigned int next;
 };
 
-/*
- * The bandwidth threshold below which the per-station CoDel parameters will be
- * scaled to be more lenient (to prevent starvation of slow stations). This
- * value will be scaled by the number of active stations when it is being
- * applied.
- */
-#define STA_SLOW_THRESHOLD 6000 /* 6 Mbps */
-
 /**
  * struct link_sta_info - Link STA information
  * All link specific sta info are stored here for reference. This can be
@@ -627,7 +619,6 @@ struct link_sta_info {
  * @sta: station information we share with the driver
  * @sta_state: duplicates information about station state (for debug)
  * @rcu_head: RCU head used for freeing this station struct
- * @cparams: CoDel parameters for this station.
  * @reserved_tid: reserved TID (if any, otherwise IEEE80211_TID_UNRESERVED)
  * @amsdu_mesh_control: track the mesh A-MSDU format used by the peer:
  *
@@ -718,8 +709,6 @@ struct sta_info {
 	struct dentry *debugfs_dir;
 #endif
 
-	struct codel_params cparams;
-
 	u8 reserved_tid;
 	s8 amsdu_mesh_control;
 
--- a/net/mac80211/tx.c
+++ b/net/mac80211/tx.c
@@ -1402,16 +1402,9 @@ static struct sk_buff *fq_tin_dequeue_fu
 
 	local = container_of(fq, struct ieee80211_local, fq);
 	txqi = container_of(tin, struct txq_info, tin);
+	cparams = &local->cparams;
 	cstats = &txqi->cstats;
 
-	if (txqi->txq.sta) {
-		struct sta_info *sta = container_of(txqi->txq.sta,
-						    struct sta_info, sta);
-		cparams = &sta->cparams;
-	} else {
-		cparams = &local->cparams;
-	}
-
 	if (flow == &tin->default_flow)
 		cvars = &txqi->def_cvars;
 	else
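With the per-station CoDel parameters gone, the per-station `aqm` debugfs file no longer carries the "target ... interval ... ecn ..." line that the removed debugfs_sta.c hunk printed. A quick way to inspect what the file still reports; the phy/interface names are placeholders and debugfs is assumed mounted in the usual place:

```sh
# Station MAC directories are matched by the wildcard; requires a mac80211
# driver and debugfs mounted at /sys/kernel/debug.
cat /sys/kernel/debug/ieee80211/phy0/netdev:wlan0/stations/*/aqm | head -n 20
```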
@@ -1,4 +1,4 @@
-From 9c2fdcdf9d8963a6fa30005a859816639d0bbf95 Mon Sep 17 00:00:00 2001
+From b3dc27f64b5d62505ae9f03a6c342a43b0b7e0b2 Mon Sep 17 00:00:00 2001
 From: Jens Axboe <axboe@kernel.dk>
 Date: Tue, 27 May 2025 07:28:54 -0600
 Subject: Revert "Disable FOP_DONTCACHE for now due to bugs"
@@ -1,70 +0,0 @@
From 1616d0edbdf3b36a8f4694d35bcf88fa1242c7e8 Mon Sep 17 00:00:00 2001
From: Jinliang Zheng <alexjlzheng@tencent.com>
Date: Tue, 15 Apr 2025 17:02:32 +0800
Subject: mm: fix ratelimit_pages update error in dirty_ratio_handler()

In dirty_ratio_handler(), vm_dirty_bytes must be set to zero before
calling writeback_set_ratelimit(), as global_dirty_limits() always
prioritizes the value of vm_dirty_bytes.

It's domain_dirty_limits() that's relevant here, not node_dirty_ok:

  dirty_ratio_handler
   writeback_set_ratelimit
    global_dirty_limits(&dirty_thresh)   <- ratelimit_pages based on dirty_thresh
     domain_dirty_limits
      if (bytes)                         <- bytes = vm_dirty_bytes <--------+
       thresh = f1(bytes)                <- prioritizes vm_dirty_bytes      |
      else                                                                  |
       thresh = f2(ratio)                                                   |
    ratelimit_pages = f3(dirty_thresh)                                      |
   vm_dirty_bytes = 0                    <- it's late! ---------------------+

This causes ratelimit_pages to still use the value calculated based on
vm_dirty_bytes, which is wrong now.

The impact visible to userspace is difficult to capture directly because
there is no procfs/sysfs interface exported to user space. However, it
will have a real impact on the balance of dirty pages.

For example:

1. On default, we have vm_dirty_ratio=40, vm_dirty_bytes=0

2. echo 8192 > dirty_bytes, then vm_dirty_bytes=8192,
   vm_dirty_ratio=0, and ratelimit_pages is calculated based on
   vm_dirty_bytes now.

3. echo 20 > dirty_ratio, then since vm_dirty_bytes is not reset to
   zero when writeback_set_ratelimit() -> global_dirty_limits() ->
   domain_dirty_limits() is called, ratelimit_pages is still calculated
   based on vm_dirty_bytes instead of vm_dirty_ratio. This does not
   conform to the actual intent of the user.

Link: https://lkml.kernel.org/r/20250415090232.7544-1-alexjlzheng@tencent.com
Fixes: 9d823e8f6b1b ("writeback: per task dirty rate limit")
Signed-off-by: Jinliang Zheng <alexjlzheng@tencent.com>
Reviewed-by: MengEn Sun <mengensun@tencent.com>
Cc: Andrea Righi <andrea@betterlinux.com>
Cc: Fenggaung Wu <fengguang.wu@intel.com>
Cc: Jinliang Zheng <alexjlzheng@tencent.com>
Cc: Matthew Wilcox (Oracle) <willy@infradead.org>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
 mm/page-writeback.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

--- a/mm/page-writeback.c
+++ b/mm/page-writeback.c
@@ -520,8 +520,8 @@ static int dirty_ratio_handler(const str
 
 	ret = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
 	if (ret == 0 && write && vm_dirty_ratio != old_ratio) {
-		writeback_set_ratelimit();
 		vm_dirty_bytes = 0;
+		writeback_set_ratelimit();
 	}
 	return ret;
 }
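The three numbered steps in that commit message map directly onto sysctl writes. A hedged shell rendition of the sequence (standard procfs paths; as the message notes, the stale ratelimit_pages value itself is kernel-internal and not directly observable):

```sh
# Reproduce the sequence from the commit message above.
cat /proc/sys/vm/dirty_ratio            # default: 40, with dirty_bytes = 0
echo 8192 > /proc/sys/vm/dirty_bytes    # ratelimit now derived from dirty_bytes
echo 20   > /proc/sys/vm/dirty_ratio    # before the fix: ratelimit_pages is
                                        # still based on the stale dirty_bytes
```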
@@ -1,4 +1,4 @@
-From 0274339dc053815d099e9c336f11c1e9e5641792 Mon Sep 17 00:00:00 2001
+From 0b8d9b7ae677a03629218f69037be3f342c5ee81 Mon Sep 17 00:00:00 2001
 From: Jens Axboe <axboe@kernel.dk>
 Date: Tue, 27 May 2025 07:28:55 -0600
 Subject: mm/filemap: unify read/write dropbehind naming
@@ -1,179 +0,0 @@
From 87f7435508fde20e21c6b744723a3203e2045f46 Mon Sep 17 00:00:00 2001
From: GONG Ruiqi <gongruiqi1@huawei.com>
Date: Sun, 27 Apr 2025 10:53:03 +0800
Subject: vgacon: Add check for vc_origin address range in vgacon_scroll()

Our in-house Syzkaller reported the following BUG (twice), which we
believed was the same issue with [1]:

==================================================================
BUG: KASAN: slab-out-of-bounds in vcs_scr_readw+0xc2/0xd0 drivers/tty/vt/vt.c:4740
Read of size 2 at addr ffff88800f5bef60 by task syz.7.2620/12393
...
Call Trace:
 <TASK>
 __dump_stack lib/dump_stack.c:88 [inline]
 dump_stack_lvl+0x72/0xa0 lib/dump_stack.c:106
 print_address_description.constprop.0+0x6b/0x3d0 mm/kasan/report.c:364
 print_report+0xba/0x280 mm/kasan/report.c:475
 kasan_report+0xa9/0xe0 mm/kasan/report.c:588
 vcs_scr_readw+0xc2/0xd0 drivers/tty/vt/vt.c:4740
 vcs_write_buf_noattr drivers/tty/vt/vc_screen.c:493 [inline]
 vcs_write+0x586/0x840 drivers/tty/vt/vc_screen.c:690
 vfs_write+0x219/0x960 fs/read_write.c:584
 ksys_write+0x12e/0x260 fs/read_write.c:639
 do_syscall_x64 arch/x86/entry/common.c:51 [inline]
 do_syscall_64+0x59/0x110 arch/x86/entry/common.c:81
 entry_SYSCALL_64_after_hwframe+0x78/0xe2
 ...
 </TASK>

Allocated by task 5614:
 kasan_save_stack+0x20/0x40 mm/kasan/common.c:45
 kasan_set_track+0x25/0x30 mm/kasan/common.c:52
 ____kasan_kmalloc mm/kasan/common.c:374 [inline]
 __kasan_kmalloc+0x8f/0xa0 mm/kasan/common.c:383
 kasan_kmalloc include/linux/kasan.h:201 [inline]
 __do_kmalloc_node mm/slab_common.c:1007 [inline]
 __kmalloc+0x62/0x140 mm/slab_common.c:1020
 kmalloc include/linux/slab.h:604 [inline]
 kzalloc include/linux/slab.h:721 [inline]
 vc_do_resize+0x235/0xf40 drivers/tty/vt/vt.c:1193
 vgacon_adjust_height+0x2d4/0x350 drivers/video/console/vgacon.c:1007
 vgacon_font_set+0x1f7/0x240 drivers/video/console/vgacon.c:1031
 con_font_set drivers/tty/vt/vt.c:4628 [inline]
 con_font_op+0x4da/0xa20 drivers/tty/vt/vt.c:4675
 vt_k_ioctl+0xa10/0xb30 drivers/tty/vt/vt_ioctl.c:474
 vt_ioctl+0x14c/0x1870 drivers/tty/vt/vt_ioctl.c:752
 tty_ioctl+0x655/0x1510 drivers/tty/tty_io.c:2779
 vfs_ioctl fs/ioctl.c:51 [inline]
 __do_sys_ioctl fs/ioctl.c:871 [inline]
 __se_sys_ioctl+0x12d/0x190 fs/ioctl.c:857
 do_syscall_x64 arch/x86/entry/common.c:51 [inline]
 do_syscall_64+0x59/0x110 arch/x86/entry/common.c:81
 entry_SYSCALL_64_after_hwframe+0x78/0xe2

Last potentially related work creation:
 kasan_save_stack+0x20/0x40 mm/kasan/common.c:45
 __kasan_record_aux_stack+0x94/0xa0 mm/kasan/generic.c:492
 __call_rcu_common.constprop.0+0xc3/0xa10 kernel/rcu/tree.c:2713
 netlink_release+0x620/0xc20 net/netlink/af_netlink.c:802
 __sock_release+0xb5/0x270 net/socket.c:663
 sock_close+0x1e/0x30 net/socket.c:1425
 __fput+0x408/0xab0 fs/file_table.c:384
 __fput_sync+0x4c/0x60 fs/file_table.c:465
 __do_sys_close fs/open.c:1580 [inline]
 __se_sys_close+0x68/0xd0 fs/open.c:1565
 do_syscall_x64 arch/x86/entry/common.c:51 [inline]
 do_syscall_64+0x59/0x110 arch/x86/entry/common.c:81
 entry_SYSCALL_64_after_hwframe+0x78/0xe2

Second to last potentially related work creation:
 kasan_save_stack+0x20/0x40 mm/kasan/common.c:45
 __kasan_record_aux_stack+0x94/0xa0 mm/kasan/generic.c:492
 __call_rcu_common.constprop.0+0xc3/0xa10 kernel/rcu/tree.c:2713
 netlink_release+0x620/0xc20 net/netlink/af_netlink.c:802
 __sock_release+0xb5/0x270 net/socket.c:663
 sock_close+0x1e/0x30 net/socket.c:1425
 __fput+0x408/0xab0 fs/file_table.c:384
 task_work_run+0x154/0x240 kernel/task_work.c:239
 exit_task_work include/linux/task_work.h:45 [inline]
 do_exit+0x8e5/0x1320 kernel/exit.c:874
 do_group_exit+0xcd/0x280 kernel/exit.c:1023
 get_signal+0x1675/0x1850 kernel/signal.c:2905
 arch_do_signal_or_restart+0x80/0x3b0 arch/x86/kernel/signal.c:310
 exit_to_user_mode_loop kernel/entry/common.c:111 [inline]
 exit_to_user_mode_prepare include/linux/entry-common.h:328 [inline]
 __syscall_exit_to_user_mode_work kernel/entry/common.c:207 [inline]
 syscall_exit_to_user_mode+0x1b3/0x1e0 kernel/entry/common.c:218
 do_syscall_64+0x66/0x110 arch/x86/entry/common.c:87
 entry_SYSCALL_64_after_hwframe+0x78/0xe2

The buggy address belongs to the object at ffff88800f5be000
 which belongs to the cache kmalloc-2k of size 2048
The buggy address is located 2656 bytes to the right of
 allocated 1280-byte region [ffff88800f5be000, ffff88800f5be500)

...

Memory state around the buggy address:
 ffff88800f5bee00: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
 ffff88800f5bee80: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
>ffff88800f5bef00: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
                                                       ^
 ffff88800f5bef80: fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc fc
 ffff88800f5bf000: 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00 00
==================================================================

By analyzing the vmcore, we found that vc->vc_origin was somehow placed
one line prior to vc->vc_screenbuf when vc was in KD_TEXT mode, and
further writings to /dev/vcs caused out-of-bounds reads (and writes
right after) in vcs_write_buf_noattr().

Our further experiments show that in most cases, vc->vc_origin equals to
vga_vram_base when the console is in KD_TEXT mode, and it's around
vc->vc_screenbuf for the KD_GRAPHICS mode. But via triggerring a
TIOCL_SETVESABLANK ioctl beforehand, we can make vc->vc_origin be around
vc->vc_screenbuf while the console is in KD_TEXT mode, and then by
writing the special 'ESC M' control sequence to the tty certain times
(depends on the value of `vc->state.y - vc->vc_top`), we can eventually
move vc->vc_origin prior to vc->vc_screenbuf. Here's the PoC, tested on
QEMU:

```
int main() {
	const int RI_NUM = 10; // should be greater than `vc->state.y - vc->vc_top`
	int tty_fd, vcs_fd;
	const char *tty_path = "/dev/tty0";
	const char *vcs_path = "/dev/vcs";
	const char escape_seq[] = "\x1bM"; // ESC + M
	const char trigger_seq[] = "Let's trigger an OOB write.";
	struct vt_sizes vt_size = { 70, 2 };
	int blank = TIOCL_BLANKSCREEN;

	tty_fd = open(tty_path, O_RDWR);

	char vesa_mode[] = { TIOCL_SETVESABLANK, 1 };
	ioctl(tty_fd, TIOCLINUX, vesa_mode);

	ioctl(tty_fd, TIOCLINUX, &blank);
	ioctl(tty_fd, VT_RESIZE, &vt_size);

	for (int i = 0; i < RI_NUM; ++i)
		write(tty_fd, escape_seq, sizeof(escape_seq) - 1);

	vcs_fd = open(vcs_path, O_RDWR);
	write(vcs_fd, trigger_seq, sizeof(trigger_seq));

	close(vcs_fd);
	close(tty_fd);
	return 0;
}
```

To solve this problem, add an address range validation check in
vgacon_scroll(), ensuring vc->vc_origin never precedes vc_screenbuf.

Reported-by: syzbot+9c09fda97a1a65ea859b@syzkaller.appspotmail.com
Closes: https://syzkaller.appspot.com/bug?extid=9c09fda97a1a65ea859b [1]
Fixes: 1da177e4c3f4 ("Linux-2.6.12-rc2")
Cc: stable@vger.kernel.org
Co-developed-by: Yi Yang <yiyang13@huawei.com>
Signed-off-by: Yi Yang <yiyang13@huawei.com>
Signed-off-by: GONG Ruiqi <gongruiqi1@huawei.com>
Signed-off-by: Helge Deller <deller@gmx.de>
---
 drivers/video/console/vgacon.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

--- a/drivers/video/console/vgacon.c
+++ b/drivers/video/console/vgacon.c
@@ -1168,7 +1168,7 @@ static bool vgacon_scroll(struct vc_data
 			    c->vc_screenbuf_size - delta);
 		c->vc_origin = vga_vram_end - c->vc_screenbuf_size;
 		vga_rolled_over = 0;
-	} else
+	} else if (oldo - delta >= (unsigned long)c->vc_screenbuf)
 		c->vc_origin -= delta;
 	c->vc_scr_end = c->vc_origin + c->vc_screenbuf_size;
 	scr_memsetw((u16 *) (c->vc_origin), c->vc_video_erase_char,
@@ -1,102 +0,0 @@
From 4aed4d2a911e165342a339c886101dbe3acad5e2 Mon Sep 17 00:00:00 2001
From: Murad Masimov <m.masimov@mt-integration.ru>
Date: Mon, 28 Apr 2025 18:34:06 +0300
Subject: fbdev: Fix do_register_framebuffer to prevent null-ptr-deref in
 fb_videomode_to_var

If fb_add_videomode() in do_register_framebuffer() fails to allocate
memory for fb_videomode, it will later lead to a null-ptr dereference in
fb_videomode_to_var(), as the fb_info is registered while not having the
mode in modelist that is expected to be there, i.e. the one that is
described in fb_info->var.

================================================================
general protection fault, probably for non-canonical address 0xdffffc0000000001: 0000 [#1] PREEMPT SMP KASAN NOPTI
KASAN: null-ptr-deref in range [0x0000000000000008-0x000000000000000f]
CPU: 1 PID: 30371 Comm: syz-executor.1 Not tainted 5.10.226-syzkaller #0
Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.12.0-1 04/01/2014
RIP: 0010:fb_videomode_to_var+0x24/0x610 drivers/video/fbdev/core/modedb.c:901
Call Trace:
 display_to_var+0x3a/0x7c0 drivers/video/fbdev/core/fbcon.c:929
 fbcon_resize+0x3e2/0x8f0 drivers/video/fbdev/core/fbcon.c:2071
 resize_screen drivers/tty/vt/vt.c:1176 [inline]
 vc_do_resize+0x53a/0x1170 drivers/tty/vt/vt.c:1263
 fbcon_modechanged+0x3ac/0x6e0 drivers/video/fbdev/core/fbcon.c:2720
 fbcon_update_vcs+0x43/0x60 drivers/video/fbdev/core/fbcon.c:2776
 do_fb_ioctl+0x6d2/0x740 drivers/video/fbdev/core/fbmem.c:1128
 fb_ioctl+0xe7/0x150 drivers/video/fbdev/core/fbmem.c:1203
 vfs_ioctl fs/ioctl.c:48 [inline]
 __do_sys_ioctl fs/ioctl.c:753 [inline]
 __se_sys_ioctl fs/ioctl.c:739 [inline]
 __x64_sys_ioctl+0x19a/0x210 fs/ioctl.c:739
 do_syscall_64+0x33/0x40 arch/x86/entry/common.c:46
 entry_SYSCALL_64_after_hwframe+0x67/0xd1
================================================================

Even though fbcon_init() checks beforehand if fb_match_mode() in
var_to_display() fails, it can not prevent the panic because fbcon_init()
does not return error code. Considering this and the comment in the code
about fb_match_mode() returning NULL - "This should not happen" - it is
better to prevent registering the fb_info if its mode was not set
successfully. Also move fb_add_videomode() closer to the beginning of
do_register_framebuffer() to avoid having to do the cleanup on fail.

Found by Linux Verification Center (linuxtesting.org) with Syzkaller.

Fixes: 1da177e4c3f4 ("Linux-2.6.12-rc2")
Cc: stable@vger.kernel.org
Signed-off-by: Murad Masimov <m.masimov@mt-integration.ru>
Signed-off-by: Helge Deller <deller@gmx.de>
---
 drivers/video/fbdev/core/fbmem.c | 18 +++++++++++-------
 1 file changed, 11 insertions(+), 7 deletions(-)

--- a/drivers/video/fbdev/core/fbmem.c
+++ b/drivers/video/fbdev/core/fbmem.c
@@ -388,7 +388,7 @@ static int fb_check_foreignness(struct f
 
 static int do_register_framebuffer(struct fb_info *fb_info)
 {
-	int i;
+	int i, err = 0;
 	struct fb_videomode mode;
 
 	if (fb_check_foreignness(fb_info))
@@ -397,10 +397,18 @@ static int do_register_framebuffer(struc
 	if (num_registered_fb == FB_MAX)
 		return -ENXIO;
 
-	num_registered_fb++;
 	for (i = 0 ; i < FB_MAX; i++)
 		if (!registered_fb[i])
 			break;
+
+	if (!fb_info->modelist.prev || !fb_info->modelist.next)
+		INIT_LIST_HEAD(&fb_info->modelist);
+
+	fb_var_to_videomode(&mode, &fb_info->var);
+	err = fb_add_videomode(&mode, &fb_info->modelist);
+	if (err < 0)
+		return err;
+
 	fb_info->node = i;
 	refcount_set(&fb_info->count, 1);
 	mutex_init(&fb_info->lock);
@@ -426,16 +434,12 @@ static int do_register_framebuffer(struc
 	if (bitmap_empty(fb_info->pixmap.blit_y, FB_MAX_BLIT_HEIGHT))
 		bitmap_fill(fb_info->pixmap.blit_y, FB_MAX_BLIT_HEIGHT);
 
-	if (!fb_info->modelist.prev || !fb_info->modelist.next)
-		INIT_LIST_HEAD(&fb_info->modelist);
-
 	if (fb_info->skip_vt_switch)
 		pm_vt_switch_required(fb_info->device, false);
 	else
 		pm_vt_switch_required(fb_info->device, true);
 
-	fb_var_to_videomode(&mode, &fb_info->var);
-	fb_add_videomode(&mode, &fb_info->modelist);
+	num_registered_fb++;
 	registered_fb[i] = fb_info;
 
 #ifdef CONFIG_GUMSTIX_AM200EPD
@@ -1,4 +1,4 @@
-From de09560d2e6fbb14ea586063217277e5ebc1bc71 Mon Sep 17 00:00:00 2001
+From 2c1c3b3aafb153cbc3bd298db57cc7313d1601b1 Mon Sep 17 00:00:00 2001
 From: Jens Axboe <axboe@kernel.dk>
 Date: Tue, 27 May 2025 07:28:56 -0600
 Subject: mm/filemap: unify dropbehind flag testing and clearing
@@ -1,65 +0,0 @@
From 10c7fce24a1ad9197a8eabbba454a9a872f03d5c Mon Sep 17 00:00:00 2001
From: Murad Masimov <m.masimov@mt-integration.ru>
Date: Mon, 28 Apr 2025 18:34:07 +0300
Subject: fbdev: Fix fb_set_var to prevent null-ptr-deref in
 fb_videomode_to_var

If fb_add_videomode() in fb_set_var() fails to allocate memory for
fb_videomode, later it may lead to a null-ptr dereference in
fb_videomode_to_var(), as the fb_info is registered while not having the
mode in modelist that is expected to be there, i.e. the one that is
described in fb_info->var.

================================================================
general protection fault, probably for non-canonical address 0xdffffc0000000001: 0000 [#1] PREEMPT SMP KASAN NOPTI
KASAN: null-ptr-deref in range [0x0000000000000008-0x000000000000000f]
CPU: 1 PID: 30371 Comm: syz-executor.1 Not tainted 5.10.226-syzkaller #0
Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.12.0-1 04/01/2014
RIP: 0010:fb_videomode_to_var+0x24/0x610 drivers/video/fbdev/core/modedb.c:901
Call Trace:
 display_to_var+0x3a/0x7c0 drivers/video/fbdev/core/fbcon.c:929
 fbcon_resize+0x3e2/0x8f0 drivers/video/fbdev/core/fbcon.c:2071
 resize_screen drivers/tty/vt/vt.c:1176 [inline]
 vc_do_resize+0x53a/0x1170 drivers/tty/vt/vt.c:1263
 fbcon_modechanged+0x3ac/0x6e0 drivers/video/fbdev/core/fbcon.c:2720
 fbcon_update_vcs+0x43/0x60 drivers/video/fbdev/core/fbcon.c:2776
 do_fb_ioctl+0x6d2/0x740 drivers/video/fbdev/core/fbmem.c:1128
 fb_ioctl+0xe7/0x150 drivers/video/fbdev/core/fbmem.c:1203
 vfs_ioctl fs/ioctl.c:48 [inline]
 __do_sys_ioctl fs/ioctl.c:753 [inline]
 __se_sys_ioctl fs/ioctl.c:739 [inline]
 __x64_sys_ioctl+0x19a/0x210 fs/ioctl.c:739
 do_syscall_64+0x33/0x40 arch/x86/entry/common.c:46
 entry_SYSCALL_64_after_hwframe+0x67/0xd1
================================================================

The reason is that fb_info->var is being modified in fb_set_var(), and
then fb_videomode_to_var() is called. If it fails to add the mode to
fb_info->modelist, fb_set_var() returns error, but does not restore the
old value of fb_info->var. Restore fb_info->var on failure the same way
it is done earlier in the function.

Found by Linux Verification Center (linuxtesting.org) with Syzkaller.

Fixes: 1da177e4c3f4 ("Linux-2.6.12-rc2")
Cc: stable@vger.kernel.org
Signed-off-by: Murad Masimov <m.masimov@mt-integration.ru>
Signed-off-by: Helge Deller <deller@gmx.de>
---
 drivers/video/fbdev/core/fbmem.c | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

--- a/drivers/video/fbdev/core/fbmem.c
+++ b/drivers/video/fbdev/core/fbmem.c
@@ -328,8 +328,10 @@ fb_set_var(struct fb_info *info, struct
 	    !list_empty(&info->modelist))
 		ret = fb_add_videomode(&mode, &info->modelist);
 
-	if (ret)
+	if (ret) {
+		info->var = old_var;
 		return ret;
+	}
 
 	event.info = info;
 	event.data = &mode;
@@ -1,4 +1,4 @@
-From c041325f222c774573ad73d35939451a4e221e52 Mon Sep 17 00:00:00 2001
+From 61d27e9dadb2eb2b7596a11a37402452d97625f7 Mon Sep 17 00:00:00 2001
 From: Shivank Garg <shivankg@amd.com>
 Date: Mon, 26 May 2025 18:28:18 +0000
 Subject: mm/khugepaged: fix race with folio split/free using temporary
@@ -1,113 +0,0 @@
From 13ccad7713b89e7693feb5346e7893dc8edce7a8 Mon Sep 17 00:00:00 2001
From: Christian Brauner <brauner@kernel.org>
Date: Mon, 7 Apr 2025 11:54:15 +0200
Subject: anon_inode: use a proper mode internally

This allows the VFS to not trip over anonymous inodes and we can add
asserts based on the mode into the vfs. When we report it to userspace
we can simply hide the mode to avoid regressions. I've audited all
direct callers of alloc_anon_inode() and only secretmen overrides i_mode
and i_op inode operations but it already uses a regular file.

Link: https://lore.kernel.org/20250407-work-anon_inode-v1-1-53a44c20d44e@kernel.org
Fixes: af153bb63a336 ("vfs: catch invalid modes in may_open()")
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Cc: stable@vger.kernel.org # all LTS kernels
Reported-by: syzbot+5d8e79d323a13aa0b248@syzkaller.appspotmail.com
Closes: https://lore.kernel.org/all/67ed3fb3.050a0220.14623d.0009.GAE@google.com
Signed-off-by: Christian Brauner <brauner@kernel.org>
---
 fs/anon_inodes.c | 36 ++++++++++++++++++++++++++++++++++++
 fs/internal.h    |  3 +++
 fs/libfs.c       |  8 +++++++-
 3 files changed, 46 insertions(+), 1 deletion(-)

--- a/fs/anon_inodes.c
+++ b/fs/anon_inodes.c
@@ -24,10 +24,44 @@
 
 #include <linux/uaccess.h>
 
+#include "internal.h"
+
 static struct vfsmount *anon_inode_mnt __ro_after_init;
 static struct inode *anon_inode_inode __ro_after_init;
 
 /*
+ * User space expects anonymous inodes to have no file type in st_mode.
+ *
+ * In particular, 'lsof' has this legacy logic:
+ *
+ *	type = s->st_mode & S_IFMT;
+ *	switch (type) {
+ *	...
+ *	case 0:
+ *		if (!strcmp(p, "anon_inode"))
+ *			Lf->ntype = Ntype = N_ANON_INODE;
+ *
+ * to detect our old anon_inode logic.
+ *
+ * Rather than mess with our internal sane inode data, just fix it
+ * up here in getattr() by masking off the format bits.
+ */
+int anon_inode_getattr(struct mnt_idmap *idmap, const struct path *path,
+		       struct kstat *stat, u32 request_mask,
+		       unsigned int query_flags)
+{
+	struct inode *inode = d_inode(path->dentry);
+
+	generic_fillattr(&nop_mnt_idmap, request_mask, inode, stat);
+	stat->mode &= ~S_IFMT;
+	return 0;
+}
+
+static const struct inode_operations anon_inode_operations = {
+	.getattr = anon_inode_getattr,
+};
+
+/*
  * anon_inodefs_dname() is called from d_path().
  */
 static char *anon_inodefs_dname(struct dentry *dentry, char *buffer, int buflen)
@@ -66,6 +100,7 @@ static struct inode *anon_inode_make_sec
 	if (IS_ERR(inode))
 		return inode;
 	inode->i_flags &= ~S_PRIVATE;
+	inode->i_op = &anon_inode_operations;
 	error = security_inode_init_security_anon(inode, &QSTR(name),
 						  context_inode);
 	if (error) {
@@ -313,6 +348,7 @@ static int __init anon_inode_init(void)
 	anon_inode_inode = alloc_anon_inode(anon_inode_mnt->mnt_sb);
 	if (IS_ERR(anon_inode_inode))
 		panic("anon_inode_init() inode allocation failed (%ld)\n", PTR_ERR(anon_inode_inode));
+	anon_inode_inode->i_op = &anon_inode_operations;
 
 	return 0;
 }
--- a/fs/internal.h
+++ b/fs/internal.h
@@ -343,3 +343,6 @@ static inline bool path_mounted(const st
 void file_f_owner_release(struct file *file);
 bool file_seek_cur_needs_f_lock(struct file *file);
 int statmount_mnt_idmap(struct mnt_idmap *idmap, struct seq_file *seq, bool uid_map);
+int anon_inode_getattr(struct mnt_idmap *idmap, const struct path *path,
+		       struct kstat *stat, u32 request_mask,
+		       unsigned int query_flags);
--- a/fs/libfs.c
+++ b/fs/libfs.c
@@ -1647,7 +1647,13 @@ struct inode *alloc_anon_inode(struct su
 	 * that it already _is_ on the dirty list.
 	 */
 	inode->i_state = I_DIRTY;
-	inode->i_mode = S_IRUSR | S_IWUSR;
+	/*
+	 * Historically anonymous inodes didn't have a type at all and
+	 * userspace has come to rely on this. Internally they're just
+	 * regular files but S_IFREG is masked off when reporting
+	 * information to userspace.
+	 */
+	inode->i_mode = S_IFREG | S_IRUSR | S_IWUSR;
 	inode->i_uid = current_fsuid();
 	inode->i_gid = current_fsgid();
 	inode->i_flags |= S_PRIVATE;
@@ -1,4 +1,4 @@
-From 76653593bdf5fda03717991681b5d60e2af015e9 Mon Sep 17 00:00:00 2001
+From 8135974e9e512fdf6d15f59947f95e44f2834c37 Mon Sep 17 00:00:00 2001
 From: Shivank Garg <shivankg@amd.com>
 Date: Wed, 30 Apr 2025 10:01:51 +0000
 Subject: mm: add folio_expected_ref_count() for reference count calculation
@@ -1,80 +0,0 @@
From 5a3eea2c3e9675a8b713eef0d52b7c437f1f613b Mon Sep 17 00:00:00 2001
From: Christian Brauner <brauner@kernel.org>
Date: Mon, 7 Apr 2025 11:54:17 +0200
Subject: anon_inode: explicitly block ->setattr()

It is currently possible to change the mode and owner of the single
anonymous inode in the kernel:

	int main(int argc, char *argv[])
	{
		int ret, sfd;
		sigset_t mask;
		struct signalfd_siginfo fdsi;

		sigemptyset(&mask);
		sigaddset(&mask, SIGINT);
		sigaddset(&mask, SIGQUIT);

		ret = sigprocmask(SIG_BLOCK, &mask, NULL);
		if (ret < 0)
			_exit(1);

		sfd = signalfd(-1, &mask, 0);
		if (sfd < 0)
			_exit(2);

		ret = fchown(sfd, 5555, 5555);
		if (ret < 0)
			_exit(3);

		ret = fchmod(sfd, 0777);
		if (ret < 0)
			_exit(3);

		_exit(4);
	}

This is a bug. It's not really a meaningful one because anonymous inodes
don't really figure into path lookup and they cannot be reopened via
/proc/<pid>/fd/<nr> and can't be used for lookup itself. So they can
only ever serve as direct references.

But it is still completely bogus to allow the mode and ownership or any
of the properties of the anonymous inode to be changed. Block this!

Link: https://lore.kernel.org/20250407-work-anon_inode-v1-3-53a44c20d44e@kernel.org
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Cc: stable@vger.kernel.org # all LTS kernels
Signed-off-by: Christian Brauner <brauner@kernel.org>
---
 fs/anon_inodes.c | 7 +++++++
 fs/internal.h    | 2 ++
 2 files changed, 9 insertions(+)

--- a/fs/anon_inodes.c
+++ b/fs/anon_inodes.c
@@ -57,8 +57,15 @@ int anon_inode_getattr(struct mnt_idmap
 	return 0;
 }
 
+int anon_inode_setattr(struct mnt_idmap *idmap, struct dentry *dentry,
+		       struct iattr *attr)
+{
+	return -EOPNOTSUPP;
+}
+
 static const struct inode_operations anon_inode_operations = {
 	.getattr = anon_inode_getattr,
+	.setattr = anon_inode_setattr,
 };
 
 /*
--- a/fs/internal.h
+++ b/fs/internal.h
@@ -346,3 +346,5 @@ int statmount_mnt_idmap(struct mnt_idmap
 int anon_inode_getattr(struct mnt_idmap *idmap, const struct path *path,
 		       struct kstat *stat, u32 request_mask,
 		       unsigned int query_flags);
+int anon_inode_setattr(struct mnt_idmap *idmap, struct dentry *dentry,
+		       struct iattr *attr);
@@ -1,4 +1,4 @@
-From 96e19aa45a528ce5c722f1925d750f74efe22a8b Mon Sep 17 00:00:00 2001
+From 3d1a493525955678c231ab7ccf0950c0ba2b9f45 Mon Sep 17 00:00:00 2001
 From: Ankit Nautiyal <ankit.k.nautiyal@intel.com>
 Date: Fri, 13 Jun 2025 11:42:46 +0530
 Subject: drm/i915/snps_hdmi_pll: Fix 64-bit divisor truncation by using
@@ -1,39 +0,0 @@
From 8c9775d285f9755477a8b1f8b215102dce014ed2 Mon Sep 17 00:00:00 2001
From: Christian Brauner <brauner@kernel.org>
Date: Mon, 7 Apr 2025 11:54:19 +0200
Subject: anon_inode: raise SB_I_NODEV and SB_I_NOEXEC

It isn't possible to execute anonymous inodes because they cannot be
opened in any way after they have been created. This includes execution:

	execveat(fd_anon_inode, "", NULL, NULL, AT_EMPTY_PATH)

Anonymous inodes have inode->f_op set to no_open_fops which sets
no_open() which returns ENXIO. That means any call to do_dentry_open()
which is the endpoint of the do_open_execat() will fail. There's no
chance to execute an anonymous inode. Unless a given subsystem overrides
it ofc.

However, we should still harden this and raise SB_I_NODEV and
SB_I_NOEXEC on the superblock itself so that no one gets any creative
ideas.

Link: https://lore.kernel.org/20250407-work-anon_inode-v1-5-53a44c20d44e@kernel.org
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Cc: stable@vger.kernel.org # all LTS kernels
Signed-off-by: Christian Brauner <brauner@kernel.org>
---
 fs/anon_inodes.c | 2 ++
 1 file changed, 2 insertions(+)

--- a/fs/anon_inodes.c
+++ b/fs/anon_inodes.c
@@ -86,6 +86,8 @@ static int anon_inodefs_init_fs_context(
 	struct pseudo_fs_context *ctx = init_pseudo(fc, ANON_INODE_FS_MAGIC);
 	if (!ctx)
 		return -ENOMEM;
+	fc->s_iflags |= SB_I_NOEXEC;
+	fc->s_iflags |= SB_I_NODEV;
 	ctx->dops = &anon_inodefs_dentry_operations;
 	return 0;
 }
debian/patches/patchset-pf/fixes/0007-mm-shmem-swap-fix-softlockup-with-mTHP-swapin.patch (vendored, new file, 190 lines)
@@ -0,0 +1,190 @@
From 3a317593ed60909e02e059a43b2ef588f95fd457 Mon Sep 17 00:00:00 2001
From: Kairui Song <kasong@tencent.com>
Date: Tue, 10 Jun 2025 01:17:51 +0800
Subject: mm/shmem, swap: fix softlockup with mTHP swapin
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Following softlockup can be easily reproduced on my test machine with:

echo always > /sys/kernel/mm/transparent_hugepage/hugepages-64kB/enabled
swapon /dev/zram0 # zram0 is a 48G swap device
mkdir -p /sys/fs/cgroup/memory/test
echo 1G > /sys/fs/cgroup/test/memory.max
echo $BASHPID > /sys/fs/cgroup/test/cgroup.procs
while true; do
	dd if=/dev/zero of=/tmp/test.img bs=1M count=5120
	cat /tmp/test.img > /dev/null
	rm /tmp/test.img
done

Then after a while:
watchdog: BUG: soft lockup - CPU#0 stuck for 763s! [cat:5787]
Modules linked in: zram virtiofs
CPU: 0 UID: 0 PID: 5787 Comm: cat Kdump: loaded Tainted: G L 6.15.0.orig-gf3021d9246bc-dirty #118 PREEMPT(voluntary)
Tainted: [L]=SOFTLOCKUP
Hardware name: Red Hat KVM/RHEL-AV, BIOS 0.0.0 02/06/2015
RIP: 0010:mpol_shared_policy_lookup+0xd/0x70
Code: e9 b8 b4 ff ff 31 c0 c3 cc cc cc cc 90 90 90 90 90 90 90 90 90 90 90 90 90 90 90 90 90 66 0f 1f 00 0f 1f 44 00 00 41 54 55 53 <48> 8b 1f 48 85 db 74 41 4c 8d 67 08 48 89 fb 48 89 f5 4c 89 e7 e8
RSP: 0018:ffffc90002b1fc28 EFLAGS: 00000202
RAX: 00000000001c20ca RBX: 0000000000724e1e RCX: 0000000000000001
RDX: ffff888118e214c8 RSI: 0000000000057d42 RDI: ffff888118e21518
RBP: 000000000002bec8 R08: 0000000000000001 R09: 0000000000000000
R10: 0000000000000bf4 R11: 0000000000000000 R12: 0000000000000001
R13: 00000000001c20ca R14: 00000000001c20ca R15: 0000000000000000
FS:  00007f03f995c740(0000) GS:ffff88a07ad9a000(0000) knlGS:0000000000000000
CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
CR2: 00007f03f98f1000 CR3: 0000000144626004 CR4: 0000000000770eb0
DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
PKRU: 55555554
Call Trace:
 <TASK>
 shmem_alloc_folio+0x31/0xc0
 shmem_swapin_folio+0x309/0xcf0
 ? filemap_get_entry+0x117/0x1e0
 ? xas_load+0xd/0xb0
 ? filemap_get_entry+0x101/0x1e0
 shmem_get_folio_gfp+0x2ed/0x5b0
 shmem_file_read_iter+0x7f/0x2e0
 vfs_read+0x252/0x330
 ksys_read+0x68/0xf0
 do_syscall_64+0x4c/0x1c0
 entry_SYSCALL_64_after_hwframe+0x76/0x7e
RIP: 0033:0x7f03f9a46991
Code: 00 48 8b 15 81 14 10 00 f7 d8 64 89 02 b8 ff ff ff ff eb bd e8 20 ad 01 00 f3 0f 1e fa 80 3d 35 97 10 00 00 74 13 31 c0 0f 05 <48> 3d 00 f0 ff ff 77 4f c3 66 0f 1f 44 00 00 55 48 89 e5 48 83 ec
RSP: 002b:00007fff3c52bd28 EFLAGS: 00000246 ORIG_RAX: 0000000000000000
RAX: ffffffffffffffda RBX: 0000000000040000 RCX: 00007f03f9a46991
RDX: 0000000000040000 RSI: 00007f03f98ba000 RDI: 0000000000000003
RBP: 00007fff3c52bd50 R08: 0000000000000000 R09: 00007f03f9b9a380
R10: 0000000000000022 R11: 0000000000000246 R12: 0000000000040000
R13: 00007f03f98ba000 R14: 0000000000000003 R15: 0000000000000000
 </TASK>

The reason is simple, readahead brought some order 0 folio in swap cache,
and the swapin mTHP folio being allocated is in conflict with it, so
swapcache_prepare fails and causes shmem_swap_alloc_folio to return
-EEXIST, and shmem simply retries again and again causing this loop.

Fix it by applying a similar fix for anon mTHP swapin.

The performance change is very slight, time of swapin 10g zero folios
with shmem (test for 12 times):
Before: 2.47s
After: 2.48s

[kasong@tencent.com: add comment]
Link: https://lkml.kernel.org/r/20250610181645.45922-1-ryncsn@gmail.com
Link: https://lkml.kernel.org/r/20250610181645.45922-1-ryncsn@gmail.com
Link: https://lkml.kernel.org/r/20250609171751.36305-1-ryncsn@gmail.com
Fixes: 1dd44c0af4fa ("mm: shmem: skip swapcache for swapin of synchronous swap device")
Signed-off-by: Kairui Song <kasong@tencent.com>
Reviewed-by: Barry Song <baohua@kernel.org>
Acked-by: Nhat Pham <nphamcs@gmail.com>
Reviewed-by: Baolin Wang <baolin.wang@linux.alibaba.com>
Cc: Baoquan He <bhe@redhat.com>
Cc: Chris Li <chrisl@kernel.org>
Cc: Hugh Dickins <hughd@google.com>
Cc: Kemeng Shi <shikemeng@huaweicloud.com>
Cc: Usama Arif <usamaarif642@gmail.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
 mm/memory.c | 20 --------------------
 mm/shmem.c  |  6 +++++-
 mm/swap.h   | 23 +++++++++++++++++++++++
 3 files changed, 28 insertions(+), 21 deletions(-)

--- a/mm/memory.c
+++ b/mm/memory.c
@@ -4225,26 +4225,6 @@ static struct folio *__alloc_swap_folio(
 }
 
 #ifdef CONFIG_TRANSPARENT_HUGEPAGE
-static inline int non_swapcache_batch(swp_entry_t entry, int max_nr)
-{
-	struct swap_info_struct *si = swp_swap_info(entry);
-	pgoff_t offset = swp_offset(entry);
-	int i;
-
-	/*
-	 * While allocating a large folio and doing swap_read_folio, which is
-	 * the case the being faulted pte doesn't have swapcache. We need to
-	 * ensure all PTEs have no cache as well, otherwise, we might go to
-	 * swap devices while the content is in swapcache.
-	 */
-	for (i = 0; i < max_nr; i++) {
-		if ((si->swap_map[offset + i] & SWAP_HAS_CACHE))
-			return i;
-	}
-
-	return i;
-}
-
 /*
  * Check if the PTEs within a range are contiguous swap entries
  * and have consistent swapcache, zeromap.
--- a/mm/shmem.c
+++ b/mm/shmem.c
@@ -2262,6 +2262,7 @@ static int shmem_swapin_folio(struct ino
 	folio = swap_cache_get_folio(swap, NULL, 0);
 	order = xa_get_order(&mapping->i_pages, index);
 	if (!folio) {
+		int nr_pages = 1 << order;
 		bool fallback_order0 = false;
 
 		/* Or update major stats only when swapin succeeds?? */
@@ -2275,9 +2276,12 @@ static int shmem_swapin_folio(struct ino
 		 * If uffd is active for the vma, we need per-page fault
 		 * fidelity to maintain the uffd semantics, then fallback
 		 * to swapin order-0 folio, as well as for zswap case.
+		 * Any existing sub folio in the swap cache also blocks
+		 * mTHP swapin.
 		 */
 		if (order > 0 && ((vma && unlikely(userfaultfd_armed(vma))) ||
-				  !zswap_never_enabled()))
+				  !zswap_never_enabled() ||
+				  non_swapcache_batch(swap, nr_pages) != nr_pages))
 			fallback_order0 = true;
 
 		/* Skip swapcache for synchronous device. */
--- a/mm/swap.h
+++ b/mm/swap.h
@@ -106,6 +106,25 @@ static inline int swap_zeromap_batch(swp
 	return find_next_bit(sis->zeromap, end, start) - start;
 }
 
+static inline int non_swapcache_batch(swp_entry_t entry, int max_nr)
+{
+	struct swap_info_struct *si = swp_swap_info(entry);
+	pgoff_t offset = swp_offset(entry);
+	int i;
+
+	/*
+	 * While allocating a large folio and doing mTHP swapin, we need to
+	 * ensure all entries are not cached, otherwise, the mTHP folio will
+	 * be in conflict with the folio in swap cache.
+	 */
+	for (i = 0; i < max_nr; i++) {
+		if ((si->swap_map[offset + i] & SWAP_HAS_CACHE))
+			return i;
+	}
+
+	return i;
+}
+
 #else /* CONFIG_SWAP */
 struct swap_iocb;
 static inline void swap_read_folio(struct folio *folio, struct swap_iocb **plug)
@@ -199,6 +218,10 @@ static inline int swap_zeromap_batch(swp
 	return 0;
 }
 
+static inline int non_swapcache_batch(swp_entry_t entry, int max_nr)
+{
+	return 0;
+}
 #endif /* CONFIG_SWAP */
 
 #endif /* _MM_SWAP_H */
@@ -1,136 +0,0 @@
From d90681a50098e204f2e111b9433f6fc73a939854 Mon Sep 17 00:00:00 2001
From: Christian Brauner <brauner@kernel.org>
Date: Mon, 21 Apr 2025 10:27:40 +0200
Subject: fs: add S_ANON_INODE

This makes it easy to detect proper anonymous inodes and to ensure that
we can detect them in codepaths such as readahead().

Readahead on anonymous inodes didn't work because they didn't have a
proper mode. Now that they have we need to retain EINVAL being returned
otherwise LTP will fail.

We also need to ensure that ioctls aren't simply fired like they are for
regular files so things like inotify inodes continue to correctly call
their own ioctl handlers as in [1].

Reported-by: Xilin Wu <sophon@radxa.com>
Link: https://lore.kernel.org/3A9139D5CD543962+89831381-31b9-4392-87ec-a84a5b3507d8@radxa.com [1]
Link: https://lore.kernel.org/7a1a7076-ff6b-4cb0-94e7-7218a0a44028@sirena.org.uk
Signed-off-by: Christian Brauner <brauner@kernel.org>
---
 fs/ioctl.c         |  7 ++++---
 fs/libfs.c         |  2 +-
 fs/pidfs.c         |  2 +-
 include/linux/fs.h |  2 ++
 mm/readahead.c     | 20 ++++++++++++++++----
 5 files changed, 24 insertions(+), 9 deletions(-)

--- a/fs/ioctl.c
+++ b/fs/ioctl.c
@@ -821,7 +821,8 @@ static int do_vfs_ioctl(struct file *fil
 		return ioctl_fioasync(fd, filp, argp);
 
 	case FIOQSIZE:
-		if (S_ISDIR(inode->i_mode) || S_ISREG(inode->i_mode) ||
+		if (S_ISDIR(inode->i_mode) ||
+		    (S_ISREG(inode->i_mode) && !IS_ANON_FILE(inode)) ||
 		    S_ISLNK(inode->i_mode)) {
 			loff_t res = inode_get_bytes(inode);
 			return copy_to_user(argp, &res, sizeof(res)) ?
@@ -856,7 +857,7 @@ static int do_vfs_ioctl(struct file *fil
 		return ioctl_file_dedupe_range(filp, argp);
 
 	case FIONREAD:
-		if (!S_ISREG(inode->i_mode))
+		if (!S_ISREG(inode->i_mode) || IS_ANON_FILE(inode))
 			return vfs_ioctl(filp, cmd, arg);
 
 		return put_user(i_size_read(inode) - filp->f_pos,
@@ -881,7 +882,7 @@ static int do_vfs_ioctl(struct file *fil
 		return ioctl_get_fs_sysfs_path(filp, argp);
 
 	default:
-		if (S_ISREG(inode->i_mode))
+		if (S_ISREG(inode->i_mode) && !IS_ANON_FILE(inode))
 			return file_ioctl(filp, cmd, argp);
 		break;
 	}
--- a/fs/libfs.c
+++ b/fs/libfs.c
@@ -1656,7 +1656,7 @@ struct inode *alloc_anon_inode(struct su
 	inode->i_mode = S_IFREG | S_IRUSR | S_IWUSR;
 	inode->i_uid = current_fsuid();
 	inode->i_gid = current_fsgid();
-	inode->i_flags |= S_PRIVATE;
+	inode->i_flags |= S_PRIVATE | S_ANON_INODE;
 	simple_inode_init_ts(inode);
 	return inode;
 }
--- a/fs/pidfs.c
+++ b/fs/pidfs.c
@@ -826,7 +826,7 @@ static int pidfs_init_inode(struct inode
 	const struct pid *pid = data;
 
 	inode->i_private = data;
-	inode->i_flags |= S_PRIVATE;
+	inode->i_flags |= S_PRIVATE | S_ANON_INODE;
 	inode->i_mode |= S_IRWXU;
 	inode->i_op = &pidfs_inode_operations;
 	inode->i_fop = &pidfs_file_operations;
--- a/include/linux/fs.h
+++ b/include/linux/fs.h
@@ -2344,6 +2344,7 @@ struct super_operations {
 #define S_CASEFOLD	(1 << 15) /* Casefolded file */
 #define S_VERITY	(1 << 16) /* Verity file (using fs/verity/) */
 #define S_KERNEL_FILE	(1 << 17) /* File is in use by the kernel (eg. fs/cachefiles) */
+#define S_ANON_INODE	(1 << 19) /* Inode is an anonymous inode */
 
 /*
  * Note that nosuid etc flags are inode-specific: setting some file-system
@@ -2400,6 +2401,7 @@ static inline bool sb_rdonly(const struc
 
 #define IS_WHITEOUT(inode)	(S_ISCHR(inode->i_mode) && \
 				 (inode)->i_rdev == WHITEOUT_DEV)
+#define IS_ANON_FILE(inode)	((inode)->i_flags & S_ANON_INODE)
 
 static inline bool HAS_UNMAPPED_ID(struct mnt_idmap *idmap,
 				   struct inode *inode)
--- a/mm/readahead.c
+++ b/mm/readahead.c
@@ -690,9 +690,15 @@ EXPORT_SYMBOL_GPL(page_cache_async_ra);
 
 ssize_t ksys_readahead(int fd, loff_t offset, size_t count)
 {
+	struct file *file;
+	const struct inode *inode;
+
 	CLASS(fd, f)(fd);
+	if (fd_empty(f))
+		return -EBADF;
 
-	if (fd_empty(f) || !(fd_file(f)->f_mode & FMODE_READ))
+	file = fd_file(f);
+	if (!(file->f_mode & FMODE_READ))
 		return -EBADF;
 
 	/*
|
||||
@@ -700,9 +706,15 @@ ssize_t ksys_readahead(int fd, loff_t of
|
||||
* that can execute readahead. If readahead is not possible
|
||||
* on this file, then we must return -EINVAL.
|
||||
*/
|
||||
- if (!fd_file(f)->f_mapping || !fd_file(f)->f_mapping->a_ops ||
|
||||
- (!S_ISREG(file_inode(fd_file(f))->i_mode) &&
|
||||
- !S_ISBLK(file_inode(fd_file(f))->i_mode)))
|
||||
+ if (!file->f_mapping)
|
||||
+ return -EINVAL;
|
||||
+ if (!file->f_mapping->a_ops)
|
||||
+ return -EINVAL;
|
||||
+
|
||||
+ inode = file_inode(file);
|
||||
+ if (!S_ISREG(inode->i_mode) && !S_ISBLK(inode->i_mode))
|
||||
+ return -EINVAL;
|
||||
+ if (IS_ANON_FILE(inode))
|
||||
return -EINVAL;
|
||||
|
||||
return vfs_fadvise(fd_file(f), offset, count, POSIX_FADV_WILLNEED);
|
100
debian/patches/patchset-pf/fixes/0008-mm-gup-revert-mm-gup-fix-infinite-loop-within-__get_.patch
vendored
Normal file
100
debian/patches/patchset-pf/fixes/0008-mm-gup-revert-mm-gup-fix-infinite-loop-within-__get_.patch
vendored
Normal file
@@ -0,0 +1,100 @@
From 4b247e559e4046bbbfab468e66f9d3197eaf12ec Mon Sep 17 00:00:00 2001
From: David Hildenbrand <david@redhat.com>
Date: Wed, 11 Jun 2025 15:13:14 +0200
Subject: mm/gup: revert "mm: gup: fix infinite loop within
 __get_longterm_locked"

After commit 1aaf8c122918 ("mm: gup: fix infinite loop within
__get_longterm_locked") we are able to longterm pin folios that are not
supposed to get longterm pinned, simply because they temporarily have the
LRU flag cleared (esp. temporarily isolated).

For example, two __get_longterm_locked() callers can race, or
__get_longterm_locked() can race with anything else that temporarily
isolates folios.

The introducing commit mentions the use case of a driver that uses
vm_ops->fault to insert pages allocated through cma_alloc() into the page
tables, assuming they can later get longterm pinned. These pages/folios
would never have the LRU flag set and consequently cannot get isolated.
There is no known in-tree user making use of that so far, fortunately.

To handle that in the future -- and avoid retrying forever to
isolate/migrate them -- we will need a different mechanism for the CMA
area *owner* to indicate that it actually already allocated the page and
is fine with longterm pinning it. The LRU flag is not suitable for that.

Probably we can lookup the relevant CMA area and query the bitmap; we only
have to care about some races, probably. If already allocated, we
could just allow longterm pinning.

Anyhow, let's fix the "must not be longterm pinned" problem first by
reverting the original commit.

Link: https://lkml.kernel.org/r/20250611131314.594529-1-david@redhat.com
Fixes: 1aaf8c122918 ("mm: gup: fix infinite loop within __get_longterm_locked")
Signed-off-by: David Hildenbrand <david@redhat.com>
Closes: https://lore.kernel.org/all/20250522092755.GA3277597@tiffany/
Reported-by: Hyesoo Yu <hyesoo.yu@samsung.com>
Reviewed-by: John Hubbard <jhubbard@nvidia.com>
Cc: Jason Gunthorpe <jgg@ziepe.ca>
Cc: Peter Xu <peterx@redhat.com>
Cc: Zhaoyang Huang <zhaoyang.huang@unisoc.com>
Cc: Aijun Sun <aijun.sun@unisoc.com>
Cc: Alistair Popple <apopple@nvidia.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/gup.c | 14 ++++++++++----
1 file changed, 10 insertions(+), 4 deletions(-)

--- a/mm/gup.c
+++ b/mm/gup.c
@@ -2320,13 +2320,13 @@ static void pofs_unpin(struct pages_or_f
/*
* Returns the number of collected folios. Return value is always >= 0.
*/
-static void collect_longterm_unpinnable_folios(
+static unsigned long collect_longterm_unpinnable_folios(
struct list_head *movable_folio_list,
struct pages_or_folios *pofs)
{
+ unsigned long i, collected = 0;
struct folio *prev_folio = NULL;
bool drain_allow = true;
- unsigned long i;

for (i = 0; i < pofs->nr_entries; i++) {
struct folio *folio = pofs_get_folio(pofs, i);
@@ -2338,6 +2338,8 @@ static void collect_longterm_unpinnable_
if (folio_is_longterm_pinnable(folio))
continue;

+ collected++;
+
if (folio_is_device_coherent(folio))
continue;

@@ -2359,6 +2361,8 @@ static void collect_longterm_unpinnable_
NR_ISOLATED_ANON + folio_is_file_lru(folio),
folio_nr_pages(folio));
}
+
+ return collected;
}

/*
@@ -2435,9 +2439,11 @@ static long
check_and_migrate_movable_pages_or_folios(struct pages_or_folios *pofs)
{
LIST_HEAD(movable_folio_list);
+ unsigned long collected;

- collect_longterm_unpinnable_folios(&movable_folio_list, pofs);
- if (list_empty(&movable_folio_list))
+ collected = collect_longterm_unpinnable_folios(&movable_folio_list,
+ pofs);
+ if (!collected)
return 0;

return migrate_longterm_unpinnable_folios(&movable_folio_list, pofs);
@@ -1,35 +0,0 @@
From c161e0ffb55a12b9b26819fa0ecf8217ab781e97 Mon Sep 17 00:00:00 2001
From: Zijun Hu <quic_zijuhu@quicinc.com>
Date: Wed, 7 May 2025 19:50:26 +0800
Subject: configfs: Do not override creating attribute file failure in
 populate_attrs()

populate_attrs() may override a failure to create attribute files with
the success of creating subsequent bin attribute files, and thus return
the wrong value.

Fix this by only creating bin attribute files when the attribute files
were all created successfully.

Fixes: 03607ace807b ("configfs: implement binary attributes")
Cc: stable@vger.kernel.org
Reviewed-by: Joel Becker <jlbec@evilplan.org>
Reviewed-by: Breno Leitao <leitao@debian.org>
Signed-off-by: Zijun Hu <quic_zijuhu@quicinc.com>
Link: https://lore.kernel.org/r/20250507-fix_configfs-v3-2-fe2d96de8dc4@quicinc.com
Signed-off-by: Andreas Hindborg <a.hindborg@kernel.org>
---
fs/configfs/dir.c | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)

--- a/fs/configfs/dir.c
+++ b/fs/configfs/dir.c
@@ -619,7 +619,7 @@ static int populate_attrs(struct config_
break;
}
}
- if (t->ct_bin_attrs) {
+ if (!error && t->ct_bin_attrs) {
for (i = 0; (bin_attr = t->ct_bin_attrs[i]) != NULL; i++) {
if (ops && ops->is_bin_visible && !ops->is_bin_visible(item, bin_attr, i))
continue;
191
debian/patches/patchset-pf/fixes/0009-mm-userfaultfd-fix-race-of-userfaultfd_move-and-swap.patch
vendored
Normal file
191
debian/patches/patchset-pf/fixes/0009-mm-userfaultfd-fix-race-of-userfaultfd_move-and-swap.patch
vendored
Normal file
@@ -0,0 +1,191 @@
From 7ebf89b788aa5b83897e99ad6e3dd6e0cb0f5030 Mon Sep 17 00:00:00 2001
From: Kairui Song <kasong@tencent.com>
Date: Wed, 4 Jun 2025 23:10:38 +0800
Subject: mm: userfaultfd: fix race of userfaultfd_move and swap cache

This commit fixes two kinds of races; they may have different results:

Barry reported a BUG_ON in commit c50f8e6053b0; we may see the same
BUG_ON if the filemap lookup returned NULL and a folio is added to the
swap cache after that.

If another kind of race is triggered (folio changed after lookup), we
may see the RSS counter corrupted:

[ 406.893936] BUG: Bad rss-counter state mm:ffff0000c5a9ddc0
type:MM_ANONPAGES val:-1
[ 406.894071] BUG: Bad rss-counter state mm:ffff0000c5a9ddc0
type:MM_SHMEMPAGES val:1

Because the folio is being accounted to the wrong VMA.

I'm not sure whether this can cause data corruption; it seems not.
The issues above are critical already.


On seeing a swap entry PTE, userfaultfd_move does a lockless swap cache
lookup, and tries to move the found folio to the faulting vma. Currently,
it relies on checking the PTE value to ensure that the moved folio still
belongs to the src swap entry and that no new folio has been added to the
swap cache, which turns out to be unreliable.

While working on and reviewing the swap table series with Barry, the
following existing races were observed and reproduced [1]:

In the example below, move_pages_pte is moving src_pte to dst_pte, where
src_pte is a swap entry PTE holding swap entry S1, and S1 is not in the
swap cache:

CPU1                               CPU2
userfaultfd_move
  move_pages_pte()
    entry = pte_to_swp_entry(orig_src_pte);
    // Here it got entry = S1
    ... < interrupted> ...
                                   <swapin src_pte, alloc and use folio A>
                                   // folio A is a newly allocated folio
                                   // and gets installed into src_pte
                                   <frees swap entry S1>
                                   // src_pte now points to folio A, S1
                                   // has swap count == 0, it can be freed
                                   // by folio_swap_swap or swap
                                   // allocator's reclaim.
                                   <try to swap out another folio B>
                                   // folio B is a folio in another VMA.
                                   <put folio B to swap cache using S1>
                                   // S1 is freed, folio B can use it
                                   // for swap out with no problem.
                                   ...
    folio = filemap_get_folio(S1)
    // Got folio B here !!!
    ... < interrupted again> ...
                                   <swapin folio B and free S1>
                                   // Now S1 is free to be used again.
                                   <swapout src_pte & folio A using S1>
                                   // Now src_pte is a swap entry PTE
                                   // holding S1 again.
    folio_trylock(folio)
    move_swap_pte
      double_pt_lock
      is_pte_pages_stable
      // Check passed because src_pte == S1
      folio_move_anon_rmap(...)
      // Moved invalid folio B here !!!

The race window is very short and requires multiple collisions of multiple
rare events, so it's very unlikely to happen, but with a deliberately
constructed reproducer and increased time window, it can be reproduced
easily.

This can be fixed by checking if the folio returned by filemap is the
valid swap cache folio after acquiring the folio lock.

Another similar race is possible: filemap_get_folio may return NULL, but
folio (A) could be swapped in and then swapped out again using the same
swap entry after the lookup. In such a case, folio (A) may remain in the
swap cache, so it must be moved too:

CPU1                               CPU2
userfaultfd_move
  move_pages_pte()
    entry = pte_to_swp_entry(orig_src_pte);
    // Here it got entry = S1, and S1 is not in swap cache
    folio = filemap_get_folio(S1)
    // Got NULL
    ... < interrupted again> ...
                                   <swapin folio A and free S1>
                                   <swapout folio A re-using S1>
    move_swap_pte
      double_pt_lock
      is_pte_pages_stable
      // Check passed because src_pte == S1
      folio_move_anon_rmap(...)
      // folio A is ignored !!!

Fix this by checking the swap cache again after acquiring the src_pte
lock. And to avoid the filemap overhead, we check swap_map directly [2].

The SWP_SYNCHRONOUS_IO path does make the problem more complex, but so far
we don't need to worry about that, since folios can only be exposed to the
swap cache in the swap out path, and this is covered in this patch by
checking the swap cache again after acquiring the src_pte lock.

Testing with a simple C program that allocates and moves several GB of
memory did not show any observable performance change.

Link: https://lkml.kernel.org/r/20250604151038.21968-1-ryncsn@gmail.com
Fixes: adef440691ba ("userfaultfd: UFFDIO_MOVE uABI")
Signed-off-by: Kairui Song <kasong@tencent.com>
Closes: https://lore.kernel.org/linux-mm/CAMgjq7B1K=6OOrK2OUZ0-tqCzi+EJt+2_K97TPGoSt=9+JwP7Q@mail.gmail.com/ [1]
Link: https://lore.kernel.org/all/CAGsJ_4yJhJBo16XhiC-nUzSheyX-V3-nFE+tAi=8Y560K8eT=A@mail.gmail.com/ [2]
Reviewed-by: Lokesh Gidra <lokeshgidra@google.com>
Acked-by: Peter Xu <peterx@redhat.com>
Reviewed-by: Suren Baghdasaryan <surenb@google.com>
Reviewed-by: Barry Song <baohua@kernel.org>
Reviewed-by: Chris Li <chrisl@kernel.org>
Cc: Andrea Arcangeli <aarcange@redhat.com>
Cc: David Hildenbrand <david@redhat.com>
Cc: Kairui Song <kasong@tencent.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/userfaultfd.c | 33 +++++++++++++++++++++++++++++++--
1 file changed, 31 insertions(+), 2 deletions(-)

--- a/mm/userfaultfd.c
+++ b/mm/userfaultfd.c
@@ -1084,8 +1084,18 @@ static int move_swap_pte(struct mm_struc
pte_t orig_dst_pte, pte_t orig_src_pte,
pmd_t *dst_pmd, pmd_t dst_pmdval,
spinlock_t *dst_ptl, spinlock_t *src_ptl,
- struct folio *src_folio)
+ struct folio *src_folio,
+ struct swap_info_struct *si, swp_entry_t entry)
{
+ /*
+ * Check if the folio still belongs to the target swap entry after
+ * acquiring the lock. Folio can be freed in the swap cache while
+ * not locked.
+ */
+ if (src_folio && unlikely(!folio_test_swapcache(src_folio) ||
+ entry.val != src_folio->swap.val))
+ return -EAGAIN;
+
double_pt_lock(dst_ptl, src_ptl);

if (!is_pte_pages_stable(dst_pte, src_pte, orig_dst_pte, orig_src_pte,
@@ -1102,6 +1112,25 @@ static int move_swap_pte(struct mm_struc
if (src_folio) {
folio_move_anon_rmap(src_folio, dst_vma);
src_folio->index = linear_page_index(dst_vma, dst_addr);
+ } else {
+ /*
+ * Check if the swap entry is cached after acquiring the src_pte
+ * lock. Otherwise, we might miss a newly loaded swap cache folio.
+ *
+ * Check swap_map directly to minimize overhead, READ_ONCE is sufficient.
+ * We are trying to catch newly added swap cache, the only possible case is
+ * when a folio is swapped in and out again staying in swap cache, using the
+ * same entry before the PTE check above. The PTL is acquired and released
+ * twice, each time after updating the swap_map's flag. So holding
+ * the PTL here ensures we see the updated value. False positive is possible,
+ * e.g. SWP_SYNCHRONOUS_IO swapin may set the flag without touching the
+ * cache, or during the tiny synchronization window between swap cache and
+ * swap_map, but it will be gone very quickly, worst result is retry jitters.
+ */
+ if (READ_ONCE(si->swap_map[swp_offset(entry)]) & SWAP_HAS_CACHE) {
+ double_pt_unlock(dst_ptl, src_ptl);
+ return -EAGAIN;
+ }
}

orig_src_pte = ptep_get_and_clear(mm, src_addr, src_pte);
@@ -1412,7 +1441,7 @@ retry:
}
err = move_swap_pte(mm, dst_vma, dst_addr, src_addr, dst_pte, src_pte,
orig_dst_pte, orig_src_pte, dst_pmd, dst_pmdval,
- dst_ptl, src_ptl, src_folio);
+ dst_ptl, src_ptl, src_folio, si, entry);
}

out:
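
As an editorial aside, the shape of this fix is the classic lock-then-revalidate pattern: take the lock, re-check the lockless snapshot, and retry if it went stale. A minimal user-space sketch (all names here are stand-ins, not the kernel API):

#include <pthread.h>
#include <stdio.h>

#define SWAP_HAS_CACHE 0x40

static pthread_mutex_t ptl = PTHREAD_MUTEX_INITIALIZER; /* stands in for the PTE lock */
static unsigned long swap_map_flags; /* stands in for si->swap_map[offset] */

/* Returns 0 on success, -1 if the snapshot went stale (like -EAGAIN above). */
static int move_swap_pte_sketch(void)
{
    pthread_mutex_lock(&ptl);

    /* Re-check state under the lock: a folio may have entered the swap
     * cache between the lockless lookup and the lock acquisition. */
    if (swap_map_flags & SWAP_HAS_CACHE) {
        pthread_mutex_unlock(&ptl);
        return -1; /* caller retries, as move_pages_pte() does on -EAGAIN */
    }

    /* ... safe to move the PTE here ... */
    pthread_mutex_unlock(&ptl);
    return 0;
}

int main(void)
{
    printf("first try: %d\n", move_swap_pte_sketch());  /* 0: nothing cached */
    swap_map_flags |= SWAP_HAS_CACHE;                    /* simulate a racing swapout */
    printf("after race: %d\n", move_swap_pte_sketch()); /* -1: retry */
    return 0;
}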
26
debian/patches/patchset-pf/fixes/0010-dm-raid-fix-variable-in-journal-device-check.patch
vendored
Normal file
26
debian/patches/patchset-pf/fixes/0010-dm-raid-fix-variable-in-journal-device-check.patch
vendored
Normal file
@@ -0,0 +1,26 @@
From 222985dcb732fae554af5276f44c30d648a1d05b Mon Sep 17 00:00:00 2001
From: Heinz Mauelshagen <heinzm@redhat.com>
Date: Tue, 10 Jun 2025 20:53:30 +0200
Subject: dm-raid: fix variable in journal device check

Replace "rdev" with correct loop variable name "r".

Signed-off-by: Heinz Mauelshagen <heinzm@redhat.com>
Cc: stable@vger.kernel.org
Fixes: 63c32ed4afc2 ("dm raid: add raid4/5/6 journaling support")
Signed-off-by: Mikulas Patocka <mpatocka@redhat.com>
---
drivers/md/dm-raid.c | 2 +-
1 file changed, 1 insertion(+), 1 deletion(-)

--- a/drivers/md/dm-raid.c
+++ b/drivers/md/dm-raid.c
@@ -2410,7 +2410,7 @@ static int super_init_validation(struct
*/
sb_retrieve_failed_devices(sb, failed_devices);
rdev_for_each(r, mddev) {
- if (test_bit(Journal, &rdev->flags) ||
+ if (test_bit(Journal, &r->flags) ||
!r->sb_page)
continue;
sb2 = page_address(r->sb_page);
@@ -1,129 +0,0 @@
From 1e9a258def978a9388a50ae43c85557b0598a7d3 Mon Sep 17 00:00:00 2001
From: Pu Lehui <pulehui@huawei.com>
Date: Thu, 29 May 2025 15:56:47 +0000
Subject: mm: fix uprobe pte be overwritten when expanding vma

Patch series "Fix uprobe pte be overwritten when expanding vma".


This patch (of 4):

We encountered a BUG alert triggered by Syzkaller as follows:
BUG: Bad rss-counter state mm:00000000b4a60fca type:MM_ANONPAGES val:1

And we can reproduce it with the following steps:
1. register uprobe on file at zero offset
2. mmap the file at zero offset:
addr1 = mmap(NULL, 2 * 4096, PROT_NONE, MAP_PRIVATE, fd, 0);
3. mremap part of vma1 to new vma2:
addr2 = mremap(addr1, 4096, 2 * 4096, MREMAP_MAYMOVE);
4. mremap back to orig addr1:
mremap(addr2, 4096, 4096, MREMAP_MAYMOVE | MREMAP_FIXED, addr1);

In step 3, the vma1 range [addr1, addr1 + 4096] will be remapped to the
new vma2 with range [addr2, addr2 + 8192], remapping the uprobe anon page
from vma1 to vma2, and then the vma1 range [addr1, addr1 + 4096] is
unmapped.

In step 4, the vma2 range [addr2, addr2 + 4096] will be remapped back to
the addr range [addr1, addr1 + 4096]. Since the addr range [addr1 + 4096,
addr1 + 8192] still maps the file, it will take vma_merge_new_range to
expand the range, and then do uprobe_mmap in vma_complete. Since the
merged vma pgoff is also zero offset, it will install a uprobe anon page
to the merged vma. However, the upcoming move_page_tables step, which uses
set_pte_at to remap the vma2 uprobe pte to the merged vma, will overwrite
the new uprobe pte in the merged vma, leaving that pte orphaned.

Since the uprobe pte will be remapped to the merged vma, we can remove the
unnecessary uprobe_mmap upon the merged vma.

This problem was first found in linux-6.6.y and also exists in the
community syzkaller:
https://lore.kernel.org/all/000000000000ada39605a5e71711@google.com/T/

Link: https://lkml.kernel.org/r/20250529155650.4017699-1-pulehui@huaweicloud.com
Link: https://lkml.kernel.org/r/20250529155650.4017699-2-pulehui@huaweicloud.com
Fixes: 2b1444983508 ("uprobes, mm, x86: Add the ability to install and remove uprobes breakpoints")
Signed-off-by: Pu Lehui <pulehui@huawei.com>
Suggested-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Reviewed-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Acked-by: David Hildenbrand <david@redhat.com>
Cc: Jann Horn <jannh@google.com>
Cc: Liam Howlett <liam.howlett@oracle.com>
Cc: "Masami Hiramatsu (Google)" <mhiramat@kernel.org>
Cc: Oleg Nesterov <oleg@redhat.com>
Cc: Peter Zijlstra <peterz@infradead.org>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/vma.c | 20 +++++++++++++++++---
mm/vma.h | 7 +++++++
2 files changed, 24 insertions(+), 3 deletions(-)

--- a/mm/vma.c
+++ b/mm/vma.c
@@ -144,6 +144,9 @@ static void init_multi_vma_prep(struct v
vp->file = vma->vm_file;
if (vp->file)
vp->mapping = vma->vm_file->f_mapping;
+
+ if (vmg && vmg->skip_vma_uprobe)
+ vp->skip_vma_uprobe = true;
}

/*
@@ -333,10 +336,13 @@ static void vma_complete(struct vma_prep

if (vp->file) {
i_mmap_unlock_write(vp->mapping);
- uprobe_mmap(vp->vma);

- if (vp->adj_next)
- uprobe_mmap(vp->adj_next);
+ if (!vp->skip_vma_uprobe) {
+ uprobe_mmap(vp->vma);
+
+ if (vp->adj_next)
+ uprobe_mmap(vp->adj_next);
+ }
}

if (vp->remove) {
@@ -1783,6 +1789,14 @@ struct vm_area_struct *copy_vma(struct v
faulted_in_anon_vma = false;
}

+ /*
+ * If the VMA we are copying might contain a uprobe PTE, ensure
+ * that we do not establish one upon merge. Otherwise, when mremap()
+ * moves page tables, it will orphan the newly created PTE.
+ */
+ if (vma->vm_file)
+ vmg.skip_vma_uprobe = true;
+
new_vma = find_vma_prev(mm, addr, &vmg.prev);
if (new_vma && new_vma->vm_start < addr + len)
return NULL; /* should never get here */
--- a/mm/vma.h
+++ b/mm/vma.h
@@ -19,6 +19,8 @@ struct vma_prepare {
struct vm_area_struct *insert;
struct vm_area_struct *remove;
struct vm_area_struct *remove2;
+
+ bool skip_vma_uprobe :1;
};

struct unlink_vma_file_batch {
@@ -120,6 +122,11 @@ struct vma_merge_struct {
*/
bool give_up_on_oom :1;

+ /*
+ * If set, skip uprobe_mmap upon merged vma.
+ */
+ bool skip_vma_uprobe :1;
+
/* Internal flags set during merge process: */

/*
@@ -1,217 +0,0 @@
From 2d8c79ec421253aab9560a47a7e73d678c84585c Mon Sep 17 00:00:00 2001
From: Jann Horn <jannh@google.com>
Date: Tue, 27 May 2025 23:23:53 +0200
Subject: mm/hugetlb: unshare page tables during VMA split, not before

Currently, __split_vma() triggers hugetlb page table unsharing through
vm_ops->may_split(). This happens before the VMA lock and rmap locks are
taken - which is too early; it allows racing VMA-locked page faults in our
process and racing rmap walks from other processes to cause page tables to
be shared again before we actually perform the split.

Fix it by explicitly calling into the hugetlb unshare logic from
__split_vma() in the same place where THP splitting also happens. At that
point, both the VMA and the rmap(s) are write-locked.

An annoying detail is that we can now call into the helper
hugetlb_unshare_pmds() from two different locking contexts:

1. from hugetlb_split(), holding:
- mmap lock (exclusively)
- VMA lock
- file rmap lock (exclusively)
2. hugetlb_unshare_all_pmds(), which I think is designed to be able to
call us with only the mmap lock held (in shared mode), but currently
only runs while holding mmap lock (exclusively) and VMA lock

Backporting note:
This commit fixes a racy protection that was introduced in commit
b30c14cd6102 ("hugetlb: unshare some PMDs when splitting VMAs"); that
commit claimed to fix an issue introduced in 5.13, but it should actually
also go all the way back.

[jannh@google.com: v2]
Link: https://lkml.kernel.org/r/20250528-hugetlb-fixes-splitrace-v2-1-1329349bad1a@google.com
Link: https://lkml.kernel.org/r/20250528-hugetlb-fixes-splitrace-v2-0-1329349bad1a@google.com
Link: https://lkml.kernel.org/r/20250527-hugetlb-fixes-splitrace-v1-1-f4136f5ec58a@google.com
Fixes: 39dde65c9940 ("[PATCH] shared page table for hugetlb page")
Signed-off-by: Jann Horn <jannh@google.com>
Cc: Liam Howlett <liam.howlett@oracle.com>
Reviewed-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Reviewed-by: Oscar Salvador <osalvador@suse.de>
Cc: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: <stable@vger.kernel.org> [b30c14cd6102: hugetlb: unshare some PMDs when splitting VMAs]
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
include/linux/hugetlb.h | 3 ++
mm/hugetlb.c | 60 +++++++++++++++++++++++---------
mm/vma.c | 7 ++++
tools/testing/vma/vma_internal.h | 2 ++
4 files changed, 56 insertions(+), 16 deletions(-)

--- a/include/linux/hugetlb.h
+++ b/include/linux/hugetlb.h
@@ -276,6 +276,7 @@ bool is_hugetlb_entry_migration(pte_t pt
bool is_hugetlb_entry_hwpoisoned(pte_t pte);
void hugetlb_unshare_all_pmds(struct vm_area_struct *vma);
void fixup_hugetlb_reservations(struct vm_area_struct *vma);
+void hugetlb_split(struct vm_area_struct *vma, unsigned long addr);

#else /* !CONFIG_HUGETLB_PAGE */

@@ -473,6 +474,8 @@ static inline void fixup_hugetlb_reserva
{
}

+static inline void hugetlb_split(struct vm_area_struct *vma, unsigned long addr) {}
+
#endif /* !CONFIG_HUGETLB_PAGE */

#ifndef pgd_write
--- a/mm/hugetlb.c
+++ b/mm/hugetlb.c
@@ -120,7 +120,7 @@ static void hugetlb_vma_lock_free(struct
static void hugetlb_vma_lock_alloc(struct vm_area_struct *vma);
static void __hugetlb_vma_unlock_write_free(struct vm_area_struct *vma);
static void hugetlb_unshare_pmds(struct vm_area_struct *vma,
- unsigned long start, unsigned long end);
+ unsigned long start, unsigned long end, bool take_locks);
static struct resv_map *vma_resv_map(struct vm_area_struct *vma);

static void hugetlb_free_folio(struct folio *folio)
@@ -5426,26 +5426,40 @@ static int hugetlb_vm_op_split(struct vm
{
if (addr & ~(huge_page_mask(hstate_vma(vma))))
return -EINVAL;
+ return 0;
+}

+void hugetlb_split(struct vm_area_struct *vma, unsigned long addr)
+{
/*
* PMD sharing is only possible for PUD_SIZE-aligned address ranges
* in HugeTLB VMAs. If we will lose PUD_SIZE alignment due to this
* split, unshare PMDs in the PUD_SIZE interval surrounding addr now.
+ * This function is called in the middle of a VMA split operation, with
+ * MM, VMA and rmap all write-locked to prevent concurrent page table
+ * walks (except hardware and gup_fast()).
*/
+ vma_assert_write_locked(vma);
+ i_mmap_assert_write_locked(vma->vm_file->f_mapping);
+
if (addr & ~PUD_MASK) {
- /*
- * hugetlb_vm_op_split is called right before we attempt to
- * split the VMA. We will need to unshare PMDs in the old and
- * new VMAs, so let's unshare before we split.
- */
unsigned long floor = addr & PUD_MASK;
unsigned long ceil = floor + PUD_SIZE;

- if (floor >= vma->vm_start && ceil <= vma->vm_end)
- hugetlb_unshare_pmds(vma, floor, ceil);
+ if (floor >= vma->vm_start && ceil <= vma->vm_end) {
+ /*
+ * Locking:
+ * Use take_locks=false here.
+ * The file rmap lock is already held.
+ * The hugetlb VMA lock can't be taken when we already
+ * hold the file rmap lock, and we don't need it because
+ * its purpose is to synchronize against concurrent page
+ * table walks, which are not possible thanks to the
+ * locks held by our caller.
+ */
+ hugetlb_unshare_pmds(vma, floor, ceil, /* take_locks = */ false);
+ }
}
-
- return 0;
}

static unsigned long hugetlb_vm_op_pagesize(struct vm_area_struct *vma)
@@ -7884,9 +7898,16 @@ void move_hugetlb_state(struct folio *ol
spin_unlock_irq(&hugetlb_lock);
}

+/*
+ * If @take_locks is false, the caller must ensure that no concurrent page table
+ * access can happen (except for gup_fast() and hardware page walks).
+ * If @take_locks is true, we take the hugetlb VMA lock (to lock out things like
+ * concurrent page fault handling) and the file rmap lock.
+ */
static void hugetlb_unshare_pmds(struct vm_area_struct *vma,
unsigned long start,
- unsigned long end)
+ unsigned long end,
+ bool take_locks)
{
struct hstate *h = hstate_vma(vma);
unsigned long sz = huge_page_size(h);
@@ -7910,8 +7931,12 @@ static void hugetlb_unshare_pmds(struct
mmu_notifier_range_init(&range, MMU_NOTIFY_CLEAR, 0, mm,
start, end);
mmu_notifier_invalidate_range_start(&range);
- hugetlb_vma_lock_write(vma);
- i_mmap_lock_write(vma->vm_file->f_mapping);
+ if (take_locks) {
+ hugetlb_vma_lock_write(vma);
+ i_mmap_lock_write(vma->vm_file->f_mapping);
+ } else {
+ i_mmap_assert_write_locked(vma->vm_file->f_mapping);
+ }
for (address = start; address < end; address += PUD_SIZE) {
ptep = hugetlb_walk(vma, address, sz);
if (!ptep)
@@ -7921,8 +7946,10 @@ static void hugetlb_unshare_pmds(struct
spin_unlock(ptl);
}
flush_hugetlb_tlb_range(vma, start, end);
- i_mmap_unlock_write(vma->vm_file->f_mapping);
- hugetlb_vma_unlock_write(vma);
+ if (take_locks) {
+ i_mmap_unlock_write(vma->vm_file->f_mapping);
+ hugetlb_vma_unlock_write(vma);
+ }
/*
* No need to call mmu_notifier_arch_invalidate_secondary_tlbs(), see
* Documentation/mm/mmu_notifier.rst.
@@ -7937,7 +7964,8 @@ static void hugetlb_unshare_pmds(struct
void hugetlb_unshare_all_pmds(struct vm_area_struct *vma)
{
hugetlb_unshare_pmds(vma, ALIGN(vma->vm_start, PUD_SIZE),
- ALIGN_DOWN(vma->vm_end, PUD_SIZE));
+ ALIGN_DOWN(vma->vm_end, PUD_SIZE),
+ /* take_locks = */ true);
}

/*
--- a/mm/vma.c
+++ b/mm/vma.c
@@ -516,7 +516,14 @@ __split_vma(struct vma_iterator *vmi, st
init_vma_prep(&vp, vma);
vp.insert = new;
vma_prepare(&vp);
+
+ /*
+ * Get rid of huge pages and shared page tables straddling the split
+ * boundary.
+ */
vma_adjust_trans_huge(vma, vma->vm_start, addr, NULL);
+ if (is_vm_hugetlb_page(vma))
+ hugetlb_split(vma, addr);

if (new_below) {
vma->vm_start = addr;
--- a/tools/testing/vma/vma_internal.h
+++ b/tools/testing/vma/vma_internal.h
@@ -793,6 +793,8 @@ static inline void vma_adjust_trans_huge
(void)next;
}

+static inline void hugetlb_split(struct vm_area_struct *, unsigned long) {}
+
static inline void vma_iter_free(struct vma_iterator *vmi)
{
mas_destroy(&vmi->mas);
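
An editorial sketch of the take_locks idiom used above, in plain pthreads (all names are stand-ins, not kernel API): one helper serves two locking contexts, either taking the lock itself or relying on the caller to already hold it.

#include <pthread.h>
#include <stdbool.h>
#include <stdio.h>

static pthread_mutex_t rmap_lock = PTHREAD_MUTEX_INITIALIZER;

static void unshare_pmds_sketch(bool take_locks)
{
    if (take_locks)
        pthread_mutex_lock(&rmap_lock);
    /* else: the caller must already hold rmap_lock; the kernel enforces
     * this with i_mmap_assert_write_locked(). */

    /* ... walk and unshare page tables under the lock ... */
    puts("unsharing under rmap lock");

    if (take_locks)
        pthread_mutex_unlock(&rmap_lock);
}

int main(void)
{
    /* Context 1: standalone call takes the lock itself,
     * like hugetlb_unshare_all_pmds(). */
    unshare_pmds_sketch(true);

    /* Context 2: a split operation already holds the lock,
     * like hugetlb_split(). */
    pthread_mutex_lock(&rmap_lock);
    unshare_pmds_sketch(false);
    pthread_mutex_unlock(&rmap_lock);
    return 0;
}

The flag trades a little readability for not having to duplicate the page-table walk in a locked and an unlocked variant.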
@@ -1,50 +0,0 @@
From e1280358284feaf844db5c6a76078b2c1738c5ae Mon Sep 17 00:00:00 2001
From: Jann Horn <jannh@google.com>
Date: Tue, 27 May 2025 23:23:54 +0200
Subject: mm/hugetlb: fix huge_pmd_unshare() vs GUP-fast race

huge_pmd_unshare() drops a reference on a page table that may have
previously been shared across processes, potentially turning it into a
normal page table used in another process in which unrelated VMAs can
afterwards be installed.

If this happens in the middle of a concurrent gup_fast(), gup_fast() could
end up walking the page tables of another process. While I don't see any
way in which that immediately leads to kernel memory corruption, it is
really weird and unexpected.

Fix it with an explicit broadcast IPI through tlb_remove_table_sync_one(),
just like we do in khugepaged when removing page tables for a THP
collapse.

Link: https://lkml.kernel.org/r/20250528-hugetlb-fixes-splitrace-v2-2-1329349bad1a@google.com
Link: https://lkml.kernel.org/r/20250527-hugetlb-fixes-splitrace-v1-2-f4136f5ec58a@google.com
Fixes: 39dde65c9940 ("[PATCH] shared page table for hugetlb page")
Signed-off-by: Jann Horn <jannh@google.com>
Reviewed-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Cc: Liam Howlett <liam.howlett@oracle.com>
Cc: Muchun Song <muchun.song@linux.dev>
Cc: Oscar Salvador <osalvador@suse.de>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/hugetlb.c | 7 +++++++
1 file changed, 7 insertions(+)

--- a/mm/hugetlb.c
+++ b/mm/hugetlb.c
@@ -7628,6 +7628,13 @@ int huge_pmd_unshare(struct mm_struct *m
return 0;

pud_clear(pud);
+ /*
+ * Once our caller drops the rmap lock, some other process might be
+ * using this page table as a normal, non-hugetlb page table.
+ * Wait for pending gup_fast() in other threads to finish before letting
+ * that happen.
+ */
+ tlb_remove_table_sync_one();
ptdesc_pmd_pts_dec(virt_to_ptdesc(ptep));
mm_dec_nr_pmds(mm);
return 1;
@@ -1,48 +0,0 @@
From b36611870ea72c82eb78d90a017658394bdb9690 Mon Sep 17 00:00:00 2001
From: SeongJae Park <sj@kernel.org>
Date: Mon, 2 Jun 2025 10:49:26 -0700
Subject: mm/madvise: handle madvise_lock() failure during race unwinding

When unwinding the race on -ERESTARTNOINTR handling of process_madvise(),
madvise_lock() failure is ignored. Check the failure and abort the
remaining work in that case.

Link: https://lkml.kernel.org/r/20250602174926.1074-1-sj@kernel.org
Fixes: 4000e3d0a367 ("mm/madvise: remove redundant mmap_lock operations from process_madvise()")
Signed-off-by: SeongJae Park <sj@kernel.org>
Reported-by: Barry Song <21cnbao@gmail.com>
Closes: https://lore.kernel.org/CAGsJ_4xJXXO0G+4BizhohSZ4yDteziPw43_uF8nPXPWxUVChzw@mail.gmail.com
Reviewed-by: Jann Horn <jannh@google.com>
Reviewed-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Acked-by: David Hildenbrand <david@redhat.com>
Reviewed-by: Shakeel Butt <shakeel.butt@linux.dev>
Reviewed-by: Barry Song <baohua@kernel.org>
Cc: Liam Howlett <liam.howlett@oracle.com>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/madvise.c | 5 ++++-
1 file changed, 4 insertions(+), 1 deletion(-)

--- a/mm/madvise.c
+++ b/mm/madvise.c
@@ -1830,7 +1830,9 @@ static ssize_t vector_madvise(struct mm_

/* Drop and reacquire lock to unwind race. */
madvise_unlock(mm, behavior);
- madvise_lock(mm, behavior);
+ ret = madvise_lock(mm, behavior);
+ if (ret)
+ goto out;
continue;
}
if (ret < 0)
@@ -1839,6 +1841,7 @@ static ssize_t vector_madvise(struct mm_
}
madvise_unlock(mm, behavior);

+out:
ret = (total_len - iov_iter_count(iter)) ? : ret;

return ret;
@@ -1,164 +0,0 @@
From f0ab226d0eae3aa7e26524efc040026a65ead640 Mon Sep 17 00:00:00 2001
From: Thomas Zimmermann <tzimmermann@suse.de>
Date: Wed, 28 May 2025 10:02:08 +0200
Subject: video: screen_info: Relocate framebuffers behind PCI bridges

Apply PCI host-bridge window offsets to screen_info framebuffers. Fixes
invalid access to I/O memory.

Resources behind a PCI host bridge can be relocated by a certain offset
in the kernel's CPU address range used for I/O. The framebuffer memory
range stored in screen_info refers to the CPU addresses as seen during
boot (where the offset is 0). During boot up, firmware may assign a
different memory offset to the PCI host bridge and thereby relocate
the framebuffer address of the PCI graphics device as seen by the kernel.
The information in screen_info must be updated as well.

The helper pcibios_bus_to_resource() performs the relocation of the
screen_info's framebuffer resource (given in PCI bus addresses). The
result matches the I/O-memory resource of the PCI graphics device (given
in CPU addresses). As before, we store away the information necessary to
later update the information in screen_info itself.

Commit 78aa89d1dfba ("firmware/sysfb: Update screen_info for relocated
EFI framebuffers") added the code for updating screen_info. It is based
on similar functionality that pre-existed in efifb. Efifb uses a pointer
to the PCI resource, while the newer code does a memcpy of the region.
Hence efifb sees any updates to the PCI resource and avoids the issue.

v3:
- Only use struct pci_bus_region for PCI bus addresses (Bjorn)
- Clarify address semantics in commit messages and comments (Bjorn)
v2:
- Fixed tags (Takashi, Ivan)
- Updated information on efifb

Signed-off-by: Thomas Zimmermann <tzimmermann@suse.de>
Reviewed-by: Javier Martinez Canillas <javierm@redhat.com>
Reported-by: "Ivan T. Ivanov" <iivanov@suse.de>
Closes: https://bugzilla.suse.com/show_bug.cgi?id=1240696
Tested-by: "Ivan T. Ivanov" <iivanov@suse.de>
Fixes: 78aa89d1dfba ("firmware/sysfb: Update screen_info for relocated EFI framebuffers")
Cc: dri-devel@lists.freedesktop.org
Cc: <stable@vger.kernel.org> # v6.9+
Link: https://lore.kernel.org/r/20250528080234.7380-1-tzimmermann@suse.de
---
drivers/video/screen_info_pci.c | 79 +++++++++++++++++++++------------
1 file changed, 50 insertions(+), 29 deletions(-)

--- a/drivers/video/screen_info_pci.c
+++ b/drivers/video/screen_info_pci.c
@@ -7,8 +7,8 @@

static struct pci_dev *screen_info_lfb_pdev;
static size_t screen_info_lfb_bar;
-static resource_size_t screen_info_lfb_offset;
-static struct resource screen_info_lfb_res = DEFINE_RES_MEM(0, 0);
+static resource_size_t screen_info_lfb_res_start; // original start of resource
+static resource_size_t screen_info_lfb_offset; // framebuffer offset within resource

static bool __screen_info_relocation_is_valid(const struct screen_info *si, struct resource *pr)
{
@@ -31,7 +31,7 @@ void screen_info_apply_fixups(void)
if (screen_info_lfb_pdev) {
struct resource *pr = &screen_info_lfb_pdev->resource[screen_info_lfb_bar];

- if (pr->start != screen_info_lfb_res.start) {
+ if (pr->start != screen_info_lfb_res_start) {
if (__screen_info_relocation_is_valid(si, pr)) {
/*
* Only update base if we have an actual
@@ -47,46 +47,67 @@ void screen_info_apply_fixups(void)
}
}

+static int __screen_info_lfb_pci_bus_region(const struct screen_info *si, unsigned int type,
+ struct pci_bus_region *r)
+{
+ u64 base, size;
+
+ base = __screen_info_lfb_base(si);
+ if (!base)
+ return -EINVAL;
+
+ size = __screen_info_lfb_size(si, type);
+ if (!size)
+ return -EINVAL;
+
+ r->start = base;
+ r->end = base + size - 1;
+
+ return 0;
+}
+
static void screen_info_fixup_lfb(struct pci_dev *pdev)
{
unsigned int type;
- struct resource res[SCREEN_INFO_MAX_RESOURCES];
- size_t i, numres;
+ struct pci_bus_region bus_region;
int ret;
+ struct resource r = {
+ .flags = IORESOURCE_MEM,
+ };
+ const struct resource *pr;
const struct screen_info *si = &screen_info;

if (screen_info_lfb_pdev)
return; // already found

type = screen_info_video_type(si);
- if (type != VIDEO_TYPE_EFI)
- return; // only applies to EFI
+ if (!__screen_info_has_lfb(type))
+ return; // only applies to EFI; maybe VESA

- ret = screen_info_resources(si, res, ARRAY_SIZE(res));
+ ret = __screen_info_lfb_pci_bus_region(si, type, &bus_region);
if (ret < 0)
return;
- numres = ret;

- for (i = 0; i < numres; ++i) {
- struct resource *r = &res[i];
- const struct resource *pr;
-
- if (!(r->flags & IORESOURCE_MEM))
- continue;
- pr = pci_find_resource(pdev, r);
- if (!pr)
- continue;
-
- /*
- * We've found a PCI device with the framebuffer
- * resource. Store away the parameters to track
- * relocation of the framebuffer aperture.
- */
- screen_info_lfb_pdev = pdev;
- screen_info_lfb_bar = pr - pdev->resource;
- screen_info_lfb_offset = r->start - pr->start;
- memcpy(&screen_info_lfb_res, r, sizeof(screen_info_lfb_res));
- }
+ /*
+ * Translate the PCI bus address to resource. Account
+ * for an offset if the framebuffer is behind a PCI host
+ * bridge.
+ */
+ pcibios_bus_to_resource(pdev->bus, &r, &bus_region);
+
+ pr = pci_find_resource(pdev, &r);
+ if (!pr)
+ return;
+
+ /*
+ * We've found a PCI device with the framebuffer
+ * resource. Store away the parameters to track
+ * relocation of the framebuffer aperture.
+ */
+ screen_info_lfb_pdev = pdev;
+ screen_info_lfb_bar = pr - pdev->resource;
+ screen_info_lfb_offset = r.start - pr->start;
+ screen_info_lfb_res_start = bus_region.start;
}
DECLARE_PCI_FIXUP_CLASS_HEADER(PCI_ANY_ID, PCI_ANY_ID, PCI_BASE_CLASS_DISPLAY, 16,
screen_info_fixup_lfb);
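
For intuition, a hedged stand-alone sketch of the bus-to-CPU translation that pcibios_bus_to_resource() performs; the window addresses below are invented purely for illustration.

#include <stdint.h>
#include <stdio.h>

int main(void)
{
    uint64_t bus_addr = 0x40000000ULL;    /* framebuffer address on the PCI bus (what screen_info stored at boot) */
    uint64_t bus_base = 0x40000000ULL;    /* hypothetical bridge window base, bus side */
    uint64_t cpu_base = 0x4040000000ULL;  /* same window in CPU address space */

    /* The translation is a fixed per-window offset. */
    uint64_t cpu_addr = bus_addr - bus_base + cpu_base;

    printf("lfb: bus %#llx -> cpu %#llx\n",
           (unsigned long long)bus_addr, (unsigned long long)cpu_addr);
    return 0;
}

When the firmware leaves the offset at 0, bus and CPU addresses coincide and the old code happened to work; with a nonzero offset, using the boot-time bus address as a CPU address faults, which is the bug this patch fixes.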
@@ -1,86 +0,0 @@
From 717bcb42b8cd4119c88249fbfc26d08e25a2ca24 Mon Sep 17 00:00:00 2001
From: Thomas Zimmermann <tzimmermann@suse.de>
Date: Tue, 3 Jun 2025 17:48:20 +0200
Subject: sysfb: Fix screen_info type check for VGA
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Use the helper screen_info_video_type() to get the framebuffer
type from struct screen_info. Handle the supported values in a
sorted switch statement.

Reading orig_video_isVGA is unreliable. On most systems it is a
VIDEO_TYPE_ constant. On some systems with VGA it is simply set
to 1 to signal the presence of a VGA output. See vga_probe() for
an example. Retrieving the screen_info type with the helper
screen_info_video_type() detects these cases and returns the
appropriate VIDEO_TYPE_ constant. For VGA, sysfb creates a device
named "vga-framebuffer".

The sysfb code has been taken from vga16fb, where it likely didn't
work correctly either. With this bugfix applied, vga16fb loads for
compatible vga-framebuffer devices.

Fixes: 0db5b61e0dc0 ("fbdev/vga16fb: Create EGA/VGA devices in sysfb code")
Cc: Thomas Zimmermann <tzimmermann@suse.de>
Cc: Javier Martinez Canillas <javierm@redhat.com>
Cc: Alex Deucher <alexander.deucher@amd.com>
Cc: Tzung-Bi Shih <tzungbi@kernel.org>
Cc: Helge Deller <deller@gmx.de>
Cc: "Uwe Kleine-König" <u.kleine-koenig@baylibre.com>
Cc: Zsolt Kajtar <soci@c64.rulez.org>
Cc: <stable@vger.kernel.org> # v6.1+
Signed-off-by: Thomas Zimmermann <tzimmermann@suse.de>
Reviewed-by: Tzung-Bi Shih <tzungbi@kernel.org>
Reviewed-by: Javier Martinez Canillas <javierm@redhat.com>
Link: https://lore.kernel.org/r/20250603154838.401882-1-tzimmermann@suse.de
---
drivers/firmware/sysfb.c | 26 ++++++++++++++++++--------
1 file changed, 18 insertions(+), 8 deletions(-)

--- a/drivers/firmware/sysfb.c
+++ b/drivers/firmware/sysfb.c
@@ -143,6 +143,7 @@ static __init int sysfb_init(void)
{
struct screen_info *si = &screen_info;
struct device *parent;
+ unsigned int type;
struct simplefb_platform_data mode;
const char *name;
bool compatible;
@@ -170,17 +171,26 @@ static __init int sysfb_init(void)
goto put_device;
}

+ type = screen_info_video_type(si);
+
/* if the FB is incompatible, create a legacy framebuffer device */
- if (si->orig_video_isVGA == VIDEO_TYPE_EFI)
- name = "efi-framebuffer";
- else if (si->orig_video_isVGA == VIDEO_TYPE_VLFB)
- name = "vesa-framebuffer";
- else if (si->orig_video_isVGA == VIDEO_TYPE_VGAC)
- name = "vga-framebuffer";
- else if (si->orig_video_isVGA == VIDEO_TYPE_EGAC)
+ switch (type) {
+ case VIDEO_TYPE_EGAC:
name = "ega-framebuffer";
- else
+ break;
+ case VIDEO_TYPE_VGAC:
+ name = "vga-framebuffer";
+ break;
+ case VIDEO_TYPE_VLFB:
+ name = "vesa-framebuffer";
+ break;
+ case VIDEO_TYPE_EFI:
+ name = "efi-framebuffer";
+ break;
+ default:
name = "platform-framebuffer";
+ break;
+ }

pd = platform_device_alloc(name, 0);
if (!pd) {
@@ -1,200 +0,0 @@
|
||||
From 08b1e02fc44abc04d813dbc827812db9ebca0dad Mon Sep 17 00:00:00 2001
|
||||
From: Luo Gengkun <luogengkun@huaweicloud.com>
|
||||
Date: Mon, 21 Apr 2025 03:50:21 +0000
|
||||
Subject: watchdog: fix watchdog may detect false positive of softlockup
|
||||
|
||||
When updating `watchdog_thresh`, there is a race condition between writing
|
||||
the new `watchdog_thresh` value and stopping the old watchdog timer. If
|
||||
the old timer triggers during this window, it may falsely detect a
|
||||
softlockup due to the old interval and the new `watchdog_thresh` value
|
||||
being used. The problem can be described as follow:
|
||||
|
||||
# We asuume previous watchdog_thresh is 60, so the watchdog timer is
|
||||
# coming every 24s.
|
||||
echo 10 > /proc/sys/kernel/watchdog_thresh (User space)
|
||||
|
|
||||
+------>+ update watchdog_thresh (We are in kernel now)
|
||||
|
|
||||
| # using old interval and new `watchdog_thresh`
|
||||
+------>+ watchdog hrtimer (irq context: detect softlockup)
|
||||
|
|
||||
|
|
||||
+-------+
|
||||
|
|
||||
|
|
||||
+ softlockup_stop_all
|
||||
|
||||
To fix this problem, introduce a shadow variable for `watchdog_thresh`.
|
||||
The update to the actual `watchdog_thresh` is delayed until after the old
|
||||
timer is stopped, preventing false positives.
|
||||
|
||||
The following testcase may help to understand this problem.
|
||||
|
||||
---------------------------------------------
|
||||
echo RT_RUNTIME_SHARE > /sys/kernel/debug/sched/features
|
||||
echo -1 > /proc/sys/kernel/sched_rt_runtime_us
|
||||
echo 0 > /sys/kernel/debug/sched/fair_server/cpu3/runtime
|
||||
echo 60 > /proc/sys/kernel/watchdog_thresh
|
||||
taskset -c 3 chrt -r 99 /bin/bash -c "while true;do true; done" &
|
||||
echo 10 > /proc/sys/kernel/watchdog_thresh &
|
||||
---------------------------------------------
|
||||
|
||||
The test case above first removes the throttling restrictions for
|
||||
real-time tasks. It then sets watchdog_thresh to 60 and executes a
|
||||
real-time task ,a simple while(1) loop, on cpu3. Consequently, the final
|
||||
command gets blocked because the presence of this real-time thread
|
||||
prevents kworker:3 from being selected by the scheduler. This eventually
|
||||
triggers a softlockup detection on cpu3 due to watchdog_timer_fn operating
|
||||
with inconsistent variable - using both the old interval and the updated
|
||||
watchdog_thresh simultaneously.
|
||||
|
||||
[nysal@linux.ibm.com: fix the SOFTLOCKUP_DETECTOR=n case]
|
||||
Link: https://lkml.kernel.org/r/20250502111120.282690-1-nysal@linux.ibm.com
|
||||
Link: https://lkml.kernel.org/r/20250421035021.3507649-1-luogengkun@huaweicloud.com
|
||||
Signed-off-by: Luo Gengkun <luogengkun@huaweicloud.com>
|
||||
Signed-off-by: Nysal Jan K.A. <nysal@linux.ibm.com>
|
||||
Cc: Doug Anderson <dianders@chromium.org>
|
||||
Cc: Joel Granados <joel.granados@kernel.org>
|
||||
Cc: Song Liu <song@kernel.org>
|
||||
Cc: Thomas Gleinxer <tglx@linutronix.de>
|
||||
Cc: "Nysal Jan K.A." <nysal@linux.ibm.com>
|
||||
Cc: Venkat Rao Bagalkote <venkat88@linux.ibm.com>
|
||||
Cc: <stable@vger.kernel.org>
|
||||
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
|
||||
---
|
||||
kernel/watchdog.c | 41 +++++++++++++++++++++++++++--------------
|
||||
1 file changed, 27 insertions(+), 14 deletions(-)
|
||||
|
||||
--- a/kernel/watchdog.c
|
||||
+++ b/kernel/watchdog.c
|
||||
@@ -47,6 +47,7 @@ int __read_mostly watchdog_user_enabled
|
||||
static int __read_mostly watchdog_hardlockup_user_enabled = WATCHDOG_HARDLOCKUP_DEFAULT;
|
||||
static int __read_mostly watchdog_softlockup_user_enabled = 1;
|
||||
int __read_mostly watchdog_thresh = 10;
|
||||
+static int __read_mostly watchdog_thresh_next;
static int __read_mostly watchdog_hardlockup_available;

struct cpumask watchdog_cpumask __read_mostly;
@@ -870,12 +871,20 @@ int lockup_detector_offline_cpu(unsigned
return 0;
}

-static void __lockup_detector_reconfigure(void)
+static void __lockup_detector_reconfigure(bool thresh_changed)
{
cpus_read_lock();
watchdog_hardlockup_stop();

softlockup_stop_all();
+ /*
+ * To prevent watchdog_timer_fn from using the old interval and
+ * the new watchdog_thresh at the same time, which could lead to
+ * false softlockup reports, it is necessary to update the
+ * watchdog_thresh after the softlockup is completed.
+ */
+ if (thresh_changed)
+ watchdog_thresh = READ_ONCE(watchdog_thresh_next);
set_sample_period();
lockup_detector_update_enable();
if (watchdog_enabled && watchdog_thresh)
@@ -888,7 +897,7 @@ static void __lockup_detector_reconfigur
void lockup_detector_reconfigure(void)
{
mutex_lock(&watchdog_mutex);
- __lockup_detector_reconfigure();
+ __lockup_detector_reconfigure(false);
mutex_unlock(&watchdog_mutex);
}

@@ -908,27 +917,29 @@ static __init void lockup_detector_setup
return;

mutex_lock(&watchdog_mutex);
- __lockup_detector_reconfigure();
+ __lockup_detector_reconfigure(false);
softlockup_initialized = true;
mutex_unlock(&watchdog_mutex);
}

#else /* CONFIG_SOFTLOCKUP_DETECTOR */
-static void __lockup_detector_reconfigure(void)
+static void __lockup_detector_reconfigure(bool thresh_changed)
{
cpus_read_lock();
watchdog_hardlockup_stop();
+ if (thresh_changed)
+ watchdog_thresh = READ_ONCE(watchdog_thresh_next);
lockup_detector_update_enable();
watchdog_hardlockup_start();
cpus_read_unlock();
}
void lockup_detector_reconfigure(void)
{
- __lockup_detector_reconfigure();
+ __lockup_detector_reconfigure(false);
}
static inline void lockup_detector_setup(void)
{
- __lockup_detector_reconfigure();
+ __lockup_detector_reconfigure(false);
}
#endif /* !CONFIG_SOFTLOCKUP_DETECTOR */

@@ -946,11 +957,11 @@ void lockup_detector_soft_poweroff(void)
#ifdef CONFIG_SYSCTL

/* Propagate any changes to the watchdog infrastructure */
-static void proc_watchdog_update(void)
+static void proc_watchdog_update(bool thresh_changed)
{
/* Remove impossible cpus to keep sysctl output clean. */
cpumask_and(&watchdog_cpumask, &watchdog_cpumask, cpu_possible_mask);
- __lockup_detector_reconfigure();
+ __lockup_detector_reconfigure(thresh_changed);
}

/*
@@ -984,7 +995,7 @@ static int proc_watchdog_common(int whic
} else {
err = proc_dointvec_minmax(table, write, buffer, lenp, ppos);
if (!err && old != READ_ONCE(*param))
- proc_watchdog_update();
+ proc_watchdog_update(false);
}
mutex_unlock(&watchdog_mutex);
return err;
@@ -1035,11 +1046,13 @@ static int proc_watchdog_thresh(const st

mutex_lock(&watchdog_mutex);

- old = READ_ONCE(watchdog_thresh);
+ watchdog_thresh_next = READ_ONCE(watchdog_thresh);
+
+ old = watchdog_thresh_next;
err = proc_dointvec_minmax(table, write, buffer, lenp, ppos);

- if (!err && write && old != READ_ONCE(watchdog_thresh))
- proc_watchdog_update();
+ if (!err && write && old != READ_ONCE(watchdog_thresh_next))
+ proc_watchdog_update(true);

mutex_unlock(&watchdog_mutex);
return err;
@@ -1060,7 +1073,7 @@ static int proc_watchdog_cpumask(const s

err = proc_do_large_bitmap(table, write, buffer, lenp, ppos);
if (!err && write)
- proc_watchdog_update();
+ proc_watchdog_update(false);

mutex_unlock(&watchdog_mutex);
return err;
@@ -1080,7 +1093,7 @@ static const struct ctl_table watchdog_s
},
{
.procname = "watchdog_thresh",
- .data = &watchdog_thresh,
+ .data = &watchdog_thresh_next,
.maxlen = sizeof(int),
.mode = 0644,
.proc_handler = proc_watchdog_thresh,
@@ -1,288 +0,0 @@
From ff8503c4997332bb5708c3b77f8a19f334e947a9 Mon Sep 17 00:00:00 2001
From: Harshit Agarwal <harshit@nutanix.com>
Date: Tue, 25 Feb 2025 18:05:53 +0000
Subject: sched/rt: Fix race in push_rt_task
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

Overview
========
When a CPU chooses to call push_rt_task and picks a task to push to
another CPU's runqueue, it calls the find_lock_lowest_rq method, which
takes a double lock on both CPUs' runqueues. If one of the locks isn't
readily available, it may lead to dropping the current runqueue lock
and reacquiring both locks at once. During this window it is possible
that the task has already migrated and is running on some other CPU.
These cases are already handled. However, if the task has migrated, has
already finished running, and another CPU is now trying to wake it up
(ttwu) such that it is queued again on the runqueue (on_rq is 1), and
if the task was last run by the same CPU, then the current checks will
pass even though the task was migrated out and is no longer in the
pushable tasks list.

Crashes
=======
This bug resulted in quite a few flavors of crashes triggering kernel
panics with various crash signatures such as assert failures, page
faults, null pointer dereferences, and queue corruption errors, all
coming from the scheduler itself.

Some of the crashes:
-> kernel BUG at kernel/sched/rt.c:1616! BUG_ON(idx >= MAX_RT_PRIO)
Call Trace:
? __die_body+0x1a/0x60
? die+0x2a/0x50
? do_trap+0x85/0x100
? pick_next_task_rt+0x6e/0x1d0
? do_error_trap+0x64/0xa0
? pick_next_task_rt+0x6e/0x1d0
? exc_invalid_op+0x4c/0x60
? pick_next_task_rt+0x6e/0x1d0
? asm_exc_invalid_op+0x12/0x20
? pick_next_task_rt+0x6e/0x1d0
__schedule+0x5cb/0x790
? update_ts_time_stats+0x55/0x70
schedule_idle+0x1e/0x40
do_idle+0x15e/0x200
cpu_startup_entry+0x19/0x20
start_secondary+0x117/0x160
secondary_startup_64_no_verify+0xb0/0xbb

-> BUG: kernel NULL pointer dereference, address: 00000000000000c0
Call Trace:
? __die_body+0x1a/0x60
? no_context+0x183/0x350
? __warn+0x8a/0xe0
? exc_page_fault+0x3d6/0x520
? asm_exc_page_fault+0x1e/0x30
? pick_next_task_rt+0xb5/0x1d0
? pick_next_task_rt+0x8c/0x1d0
__schedule+0x583/0x7e0
? update_ts_time_stats+0x55/0x70
schedule_idle+0x1e/0x40
do_idle+0x15e/0x200
cpu_startup_entry+0x19/0x20
start_secondary+0x117/0x160
secondary_startup_64_no_verify+0xb0/0xbb

-> BUG: unable to handle page fault for address: ffff9464daea5900
kernel BUG at kernel/sched/rt.c:1861! BUG_ON(rq->cpu != task_cpu(p))

-> kernel BUG at kernel/sched/rt.c:1055! BUG_ON(!rq->nr_running)
Call Trace:
? __die_body+0x1a/0x60
? die+0x2a/0x50
? do_trap+0x85/0x100
? dequeue_top_rt_rq+0xa2/0xb0
? do_error_trap+0x64/0xa0
? dequeue_top_rt_rq+0xa2/0xb0
? exc_invalid_op+0x4c/0x60
? dequeue_top_rt_rq+0xa2/0xb0
? asm_exc_invalid_op+0x12/0x20
? dequeue_top_rt_rq+0xa2/0xb0
dequeue_rt_entity+0x1f/0x70
dequeue_task_rt+0x2d/0x70
__schedule+0x1a8/0x7e0
? blk_finish_plug+0x25/0x40
schedule+0x3c/0xb0
futex_wait_queue_me+0xb6/0x120
futex_wait+0xd9/0x240
do_futex+0x344/0xa90
? get_mm_exe_file+0x30/0x60
? audit_exe_compare+0x58/0x70
? audit_filter_rules.constprop.26+0x65e/0x1220
__x64_sys_futex+0x148/0x1f0
do_syscall_64+0x30/0x80
entry_SYSCALL_64_after_hwframe+0x62/0xc7

-> BUG: unable to handle page fault for address: ffff8cf3608bc2c0
Call Trace:
? __die_body+0x1a/0x60
? no_context+0x183/0x350
? spurious_kernel_fault+0x171/0x1c0
? exc_page_fault+0x3b6/0x520
? plist_check_list+0x15/0x40
? plist_check_list+0x2e/0x40
? asm_exc_page_fault+0x1e/0x30
? _cond_resched+0x15/0x30
? futex_wait_queue_me+0xc8/0x120
? futex_wait+0xd9/0x240
? try_to_wake_up+0x1b8/0x490
? futex_wake+0x78/0x160
? do_futex+0xcd/0xa90
? plist_check_list+0x15/0x40
? plist_check_list+0x2e/0x40
? plist_del+0x6a/0xd0
? plist_check_list+0x15/0x40
? plist_check_list+0x2e/0x40
? dequeue_pushable_task+0x20/0x70
? __schedule+0x382/0x7e0
? asm_sysvec_reschedule_ipi+0xa/0x20
? schedule+0x3c/0xb0
? exit_to_user_mode_prepare+0x9e/0x150
? irqentry_exit_to_user_mode+0x5/0x30
? asm_sysvec_reschedule_ipi+0x12/0x20

Above are some of the common examples of the crashes that were observed
due to this issue.

Details
=======
Let's look at the following scenario to understand this race.

1) CPU A enters push_rt_task
   a) CPU A has chosen next_task = task p.
   b) CPU A calls find_lock_lowest_rq(Task p, CPU Z’s rq).
   c) CPU A identifies CPU X as a destination CPU (X < Z).
   d) CPU A enters double_lock_balance(CPU Z’s rq, CPU X’s rq).
   e) Since X is lower than Z, CPU A unlocks CPU Z’s rq. Someone else
      has locked CPU X’s rq, and thus, CPU A must wait.

2) At CPU Z
   a) The previous task has completed execution and thus, CPU Z enters
      schedule, locks its own rq after CPU A releases it.
   b) CPU Z dequeues the previous task and begins executing task p.
   c) CPU Z unlocks its rq.
   d) Task p yields the CPU (e.g. by doing IO or waiting to acquire a
      lock), which triggers the schedule function on CPU Z.
   e) CPU Z enters schedule again, locks its own rq, and dequeues task p.
   f) As part of dequeue, it sets p.on_rq = 0 and unlocks its rq.

3) At CPU B
   a) CPU B enters try_to_wake_up with input task p.
   b) Since CPU Z dequeued task p, p.on_rq = 0, and CPU B updates
      B.state = WAKING.
   c) CPU B via select_task_rq determines CPU Y as the target CPU.

4) The race
   a) CPU A acquires CPU X’s lock and relocks CPU Z.
   b) CPU A reads task p.cpu = Z and incorrectly concludes task p is
      still on CPU Z.
   c) CPU A failed to notice task p had been dequeued from CPU Z while
      CPU A was waiting for locks in double_lock_balance. If CPU A had
      known that task p had been dequeued, it would return NULL, forcing
      push_rt_task to give up on task p's migration.
   d) CPU B updates task p.cpu = Y and calls ttwu_queue.
   e) CPU B locks Y’s rq. CPU B enqueues task p onto Y and sets task
      p.on_rq = 1.
   f) CPU B unlocks CPU Y, triggering memory synchronization.
   g) CPU A reads task p.on_rq = 1, cementing its assumption that task p
      has not migrated.
   h) CPU A decides to migrate p to CPU X.

This leads to A dequeuing p from Y's queue and various crashes down the
line.

Solution
========
The solution here is fairly simple. After obtaining the lock (at 4a),
the check is enhanced to make sure that the task is still at the head of
the pushable tasks list. If not, it is in any case not a suitable
candidate for being pushed out.
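
[Editor's note] A condensed sketch of the revalidation pattern this fix
relies on, paraphrased from the diff below (not a verbatim excerpt): inside
find_lock_lowest_rq(), after double_lock_balance() may have dropped and
re-taken rq->lock, the task is only trusted if it is still the head of this
runqueue's pushable list:

    /* rq->lock was possibly dropped; re-derive everything */
    if (unlikely(is_migration_disabled(task) ||
                 !cpumask_test_cpu(lowest_rq->cpu, &task->cpus_mask) ||
                 task != pick_next_pushable_task(rq))) {
            double_unlock_balance(rq, lowest_rq);
            lowest_rq = NULL;   /* caller gives up on this push */
    }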

Testing
=======
The fix is tested on a cluster of 3 nodes, where the panics due to this
are hit every couple of days. A fix similar to this was deployed on such
a cluster and was stable for more than 30 days.

Co-developed-by: Jon Kohler <jon@nutanix.com>
Signed-off-by: Jon Kohler <jon@nutanix.com>
Co-developed-by: Gauri Patwardhan <gauri.patwardhan@nutanix.com>
Signed-off-by: Gauri Patwardhan <gauri.patwardhan@nutanix.com>
Co-developed-by: Rahul Chunduru <rahul.chunduru@nutanix.com>
Signed-off-by: Rahul Chunduru <rahul.chunduru@nutanix.com>
Signed-off-by: Harshit Agarwal <harshit@nutanix.com>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Reviewed-by: "Steven Rostedt (Google)" <rostedt@goodmis.org>
Reviewed-by: Phil Auld <pauld@redhat.com>
Tested-by: Will Ton <william.ton@nutanix.com>
Cc: stable@vger.kernel.org
Link: https://lore.kernel.org/r/20250225180553.167995-1-harshit@nutanix.com
---
kernel/sched/rt.c | 54 +++++++++++++++++++++++------------------------
1 file changed, 26 insertions(+), 28 deletions(-)

--- a/kernel/sched/rt.c
+++ b/kernel/sched/rt.c
@@ -1883,6 +1883,27 @@ static int find_lowest_rq(struct task_st
return -1;
}

+static struct task_struct *pick_next_pushable_task(struct rq *rq)
+{
+ struct task_struct *p;
+
+ if (!has_pushable_tasks(rq))
+ return NULL;
+
+ p = plist_first_entry(&rq->rt.pushable_tasks,
+ struct task_struct, pushable_tasks);
+
+ BUG_ON(rq->cpu != task_cpu(p));
+ BUG_ON(task_current(rq, p));
+ BUG_ON(task_current_donor(rq, p));
+ BUG_ON(p->nr_cpus_allowed <= 1);
+
+ BUG_ON(!task_on_rq_queued(p));
+ BUG_ON(!rt_task(p));
+
+ return p;
+}
+
/* Will lock the rq it finds */
static struct rq *find_lock_lowest_rq(struct task_struct *task, struct rq *rq)
{
@@ -1913,18 +1934,16 @@ static struct rq *find_lock_lowest_rq(st
/*
* We had to unlock the run queue. In
* the mean time, task could have
- * migrated already or had its affinity changed.
- * Also make sure that it wasn't scheduled on its rq.
+ * migrated already or had its affinity changed,
+ * therefore check if the task is still at the
+ * head of the pushable tasks list.
* It is possible the task was scheduled, set
* "migrate_disabled" and then got preempted, so we must
* check the task migration disable flag here too.
*/
- if (unlikely(task_rq(task) != rq ||
+ if (unlikely(is_migration_disabled(task) ||
!cpumask_test_cpu(lowest_rq->cpu, &task->cpus_mask) ||
- task_on_cpu(rq, task) ||
- !rt_task(task) ||
- is_migration_disabled(task) ||
- !task_on_rq_queued(task))) {
+ task != pick_next_pushable_task(rq))) {

double_unlock_balance(rq, lowest_rq);
lowest_rq = NULL;
@@ -1944,27 +1963,6 @@ static struct rq *find_lock_lowest_rq(st
return lowest_rq;
}

-static struct task_struct *pick_next_pushable_task(struct rq *rq)
-{
- struct task_struct *p;
-
- if (!has_pushable_tasks(rq))
- return NULL;
-
- p = plist_first_entry(&rq->rt.pushable_tasks,
- struct task_struct, pushable_tasks);
-
- BUG_ON(rq->cpu != task_cpu(p));
- BUG_ON(task_current(rq, p));
- BUG_ON(task_current_donor(rq, p));
- BUG_ON(p->nr_cpus_allowed <= 1);
-
- BUG_ON(!task_on_rq_queued(p));
- BUG_ON(!rt_task(p));
-
- return p;
-}
-
/*
* If the current CPU has more than one RT task, see if the non
* running task can migrate over to a CPU that is running a task
@@ -1,62 +0,0 @@
From e02cbdc12bf63da363d7e3391376819241d67fbe Mon Sep 17 00:00:00 2001
From: Peter Zijlstra <peterz@infradead.org>
Date: Tue, 28 Jan 2025 15:39:49 +0100
Subject: sched/fair: Adhere to place_entity() constraints

Mike reports that commit 6d71a9c61604 ("sched/fair: Fix EEVDF entity
placement bug causing scheduling lag") relies on commit 4423af84b297
("sched/fair: optimize the PLACE_LAG when se->vlag is zero") to not
trip a WARN in place_entity().

What happens is that the lag of the very last entity is 0 per
definition -- the average of one element matches the value of that
element. Therefore place_entity() will match the condition skipping
the lag adjustment:

if (sched_feat(PLACE_LAG) && cfs_rq->nr_queued && se->vlag) {

Without the 'se->vlag' condition, it will attempt to adjust the zero
lag even though we're inserting into an empty tree.
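
[Editor's note] In simplified EEVDF terms (paraphrased bookkeeping, not
the exact kernel formulas), the degenerate case looks like this:

    /* lag is measured against the queue's average vruntime */
    vlag = avg_vruntime(cfs_rq) - se->vruntime;

    /* with exactly one queued entity the average IS that entity's
     * vruntime, so the last entity always ends up with vlag == 0 */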

Notably, we should have failed the 'cfs_rq->nr_queued' condition, but
don't, because it didn't get updated.

Additionally, move update_load_add() after the place_entity() call, as
is consistent with other place_entity() users -- this change is
non-functional, place_entity() does not use cfs_rq->load.

Fixes: 6d71a9c61604 ("sched/fair: Fix EEVDF entity placement bug causing scheduling lag")
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Reported-by: Mike Galbraith <efault@gmx.de>
Signed-off-by: "Peter Zijlstra (Intel)" <peterz@infradead.org>
Signed-off-by: Mike Galbraith <efault@gmx.de>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: stable@vger.kernel.org
Link: https://lore.kernel.org/r/c216eb4ef0e0e0029c600aefc69d56681cee5581.camel@gmx.de
---
kernel/sched/fair.c | 4 +++-
1 file changed, 3 insertions(+), 1 deletion(-)

--- a/kernel/sched/fair.c
+++ b/kernel/sched/fair.c
@@ -3808,6 +3808,7 @@ static void reweight_entity(struct cfs_r
update_entity_lag(cfs_rq, se);
se->deadline -= se->vruntime;
se->rel_deadline = 1;
+ cfs_rq->nr_queued--;
if (!curr)
__dequeue_entity(cfs_rq, se);
update_load_sub(&cfs_rq->load, se->load.weight);
@@ -3834,10 +3835,11 @@ static void reweight_entity(struct cfs_r

enqueue_load_avg(cfs_rq, se);
if (se->on_rq) {
- update_load_add(&cfs_rq->load, se->load.weight);
place_entity(cfs_rq, se, 0);
+ update_load_add(&cfs_rq->load, se->load.weight);
if (!curr)
__enqueue_entity(cfs_rq, se);
+ cfs_rq->nr_queued++;

/*
* The entity's vruntime has been adjusted, so let's check
@@ -1,184 +0,0 @@
From 7257e4f8df6b5783978ab06063fc8529ee2631d5 Mon Sep 17 00:00:00 2001
From: Suren Baghdasaryan <surenb@google.com>
Date: Wed, 21 May 2025 09:06:02 -0700
Subject: alloc_tag: handle module codetag load errors as module load failures

Failures inside codetag_load_module() are currently ignored. As a result
an error there would not cause a module load failure and freeing of the
associated resources. Correct this behavior by propagating the error code
to the caller and handling possible errors. With this change, a failure
to allocate percpu counters, which happens at this stage, is no longer
ignored and will cause a module load failure and freeing of resources.
With this change we also no longer need to disable memory allocation
profiling when this error happens; instead, we fail to load the module.
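
[Editor's note] The underlying pattern is register-then-rollback: if a
later init step fails, the earlier registration must be undone before the
error is propagated. A condensed sketch of what codetag_module_init() does
after this patch (simplified from the diff below):

    mod_id = idr_alloc(&cttype->mod_idr, cmod, 0, 0, GFP_KERNEL);
    if (mod_id < 0)
            return mod_id;          /* registration itself failed */

    err = cttype->desc.module_load(mod, range.start, range.stop);
    if (err)
            idr_remove(&cttype->mod_idr, mod_id);  /* roll back */
    return err;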

Link: https://lkml.kernel.org/r/20250521160602.1940771-1-surenb@google.com
Fixes: 10075262888b ("alloc_tag: allocate percpu counters for module tags dynamically")
Signed-off-by: Suren Baghdasaryan <surenb@google.com>
Reported-by: Casey Chen <cachen@purestorage.com>
Closes: https://lore.kernel.org/all/20250520231620.15259-1-cachen@purestorage.com/
Cc: Daniel Gomez <da.gomez@samsung.com>
Cc: David Wang <00107082@163.com>
Cc: Kent Overstreet <kent.overstreet@linux.dev>
Cc: Luis Chamberlain <mcgrof@kernel.org>
Cc: Petr Pavlu <petr.pavlu@suse.com>
Cc: Sami Tolvanen <samitolvanen@google.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
include/linux/codetag.h | 8 ++++----
kernel/module/main.c | 5 +++--
lib/alloc_tag.c | 12 +++++++-----
lib/codetag.c | 34 +++++++++++++++++++++++++---------
4 files changed, 39 insertions(+), 20 deletions(-)

--- a/include/linux/codetag.h
+++ b/include/linux/codetag.h
@@ -36,8 +36,8 @@ union codetag_ref {
struct codetag_type_desc {
const char *section;
size_t tag_size;
- void (*module_load)(struct module *mod,
- struct codetag *start, struct codetag *end);
+ int (*module_load)(struct module *mod,
+ struct codetag *start, struct codetag *end);
void (*module_unload)(struct module *mod,
struct codetag *start, struct codetag *end);
#ifdef CONFIG_MODULES
@@ -89,7 +89,7 @@ void *codetag_alloc_module_section(struc
unsigned long align);
void codetag_free_module_sections(struct module *mod);
void codetag_module_replaced(struct module *mod, struct module *new_mod);
-void codetag_load_module(struct module *mod);
+int codetag_load_module(struct module *mod);
void codetag_unload_module(struct module *mod);

#else /* defined(CONFIG_CODE_TAGGING) && defined(CONFIG_MODULES) */
@@ -103,7 +103,7 @@ codetag_alloc_module_section(struct modu
unsigned long align) { return NULL; }
static inline void codetag_free_module_sections(struct module *mod) {}
static inline void codetag_module_replaced(struct module *mod, struct module *new_mod) {}
-static inline void codetag_load_module(struct module *mod) {}
+static inline int codetag_load_module(struct module *mod) { return 0; }
static inline void codetag_unload_module(struct module *mod) {}

#endif /* defined(CONFIG_CODE_TAGGING) && defined(CONFIG_MODULES) */
--- a/kernel/module/main.c
+++ b/kernel/module/main.c
@@ -3399,11 +3399,12 @@ static int load_module(struct load_info
goto sysfs_cleanup;
}

+ if (codetag_load_module(mod))
+ goto sysfs_cleanup;
+
/* Get rid of temporary copy. */
free_copy(info, flags);

- codetag_load_module(mod);
-
/* Done! */
trace_module_load(mod);

--- a/lib/alloc_tag.c
+++ b/lib/alloc_tag.c
@@ -618,15 +618,16 @@ out:
mas_unlock(&mas);
}

-static void load_module(struct module *mod, struct codetag *start, struct codetag *stop)
+static int load_module(struct module *mod, struct codetag *start, struct codetag *stop)
{
/* Allocate module alloc_tag percpu counters */
struct alloc_tag *start_tag;
struct alloc_tag *stop_tag;
struct alloc_tag *tag;

+ /* percpu counters for core allocations are already statically allocated */
if (!mod)
- return;
+ return 0;

start_tag = ct_to_alloc_tag(start);
stop_tag = ct_to_alloc_tag(stop);
@@ -638,12 +639,13 @@ static void load_module(struct module *m
free_percpu(tag->counters);
tag->counters = NULL;
}
- shutdown_mem_profiling(true);
- pr_err("Failed to allocate memory for allocation tag percpu counters in the module %s. Memory allocation profiling is disabled!\n",
+ pr_err("Failed to allocate memory for allocation tag percpu counters in the module %s\n",
mod->name);
- break;
+ return -ENOMEM;
}
}
+
+ return 0;
}

static void replace_module(struct module *mod, struct module *new_mod)
--- a/lib/codetag.c
+++ b/lib/codetag.c
@@ -167,6 +167,7 @@ static int codetag_module_init(struct co
{
struct codetag_range range;
struct codetag_module *cmod;
+ int mod_id;
int err;

range = get_section_range(mod, cttype->desc.section);
@@ -190,11 +191,20 @@ static int codetag_module_init(struct co
cmod->range = range;

down_write(&cttype->mod_lock);
- err = idr_alloc(&cttype->mod_idr, cmod, 0, 0, GFP_KERNEL);
- if (err >= 0) {
- cttype->count += range_size(cttype, &range);
- if (cttype->desc.module_load)
- cttype->desc.module_load(mod, range.start, range.stop);
+ mod_id = idr_alloc(&cttype->mod_idr, cmod, 0, 0, GFP_KERNEL);
+ if (mod_id >= 0) {
+ if (cttype->desc.module_load) {
+ err = cttype->desc.module_load(mod, range.start, range.stop);
+ if (!err)
+ cttype->count += range_size(cttype, &range);
+ else
+ idr_remove(&cttype->mod_idr, mod_id);
+ } else {
+ cttype->count += range_size(cttype, &range);
+ err = 0;
+ }
+ } else {
+ err = mod_id;
}
up_write(&cttype->mod_lock);

@@ -295,17 +305,23 @@ void codetag_module_replaced(struct modu
mutex_unlock(&codetag_lock);
}

-void codetag_load_module(struct module *mod)
+int codetag_load_module(struct module *mod)
{
struct codetag_type *cttype;
+ int ret = 0;

if (!mod)
- return;
+ return 0;

mutex_lock(&codetag_lock);
- list_for_each_entry(cttype, &codetag_types, link)
- codetag_module_init(cttype, mod);
+ list_for_each_entry(cttype, &codetag_types, link) {
+ ret = codetag_module_init(cttype, mod);
+ if (ret)
+ break;
+ }
mutex_unlock(&codetag_lock);
+
+ return ret;
}

void codetag_unload_module(struct module *mod)
@@ -1,29 +0,0 @@
From 57fdc30dcdad60e3b868682cc1e77083c091aef5 Mon Sep 17 00:00:00 2001
From: Chuck Lever <chuck.lever@oracle.com>
Date: Sun, 27 Apr 2025 12:39:59 -0400
Subject: svcrdma: Unregister the device if svc_rdma_accept() fails

To handle device removal, svc_rdma_accept() requests removal
notification for the underlying device when accepting a connection.
However, svc_rdma_free() is not invoked if svc_rdma_accept() fails.
There needs to be a matching "unregister" in that case; otherwise
the device cannot be removed.

Fixes: c4de97f7c454 ("svcrdma: Handle device removal outside of the CM event handler")
Cc: stable@vger.kernel.org
Reviewed-by: Zhu Yanjun <yanjun.zhu@linux.dev>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
net/sunrpc/xprtrdma/svc_rdma_transport.c | 1 +
1 file changed, 1 insertion(+)

--- a/net/sunrpc/xprtrdma/svc_rdma_transport.c
+++ b/net/sunrpc/xprtrdma/svc_rdma_transport.c
@@ -577,6 +577,7 @@ static struct svc_xprt *svc_rdma_accept(
if (newxprt->sc_qp && !IS_ERR(newxprt->sc_qp))
ib_destroy_qp(newxprt->sc_qp);
rdma_destroy_id(newxprt->sc_cm_id);
+ rpcrdma_rn_unregister(dev, &newxprt->sc_rn);
/* This call to put will destroy the transport */
svc_xprt_put(&newxprt->sc_xprt);
return NULL;
@@ -1,53 +0,0 @@
From 92e99ba55ff0ce68ea7567331beda21861da2028 Mon Sep 17 00:00:00 2001
From: Chuck Lever <chuck.lever@oracle.com>
Date: Wed, 21 May 2025 16:34:13 -0400
Subject: SUNRPC: Prevent hang on NFS mount with xprtsec=[m]tls

Engineers at Hammerspace noticed that sometimes mounting with
"xprtsec=tls" hangs for a minute or so, and then times out, even
when the NFS server is reachable and responsive.

kTLS shuts off data_ready callbacks while strp->msg_ready is set,
to suppress further data_ready callbacks when a full TLS record is
not yet ready to be read from the socket.

Normally msg_ready is clear when the first TLS record arrives on
a socket. However, I observed that sometimes tls_setsockopt() sets
strp->msg_ready, and that prevents forward progress because
tls_data_ready() becomes a no-op.

Moreover, Jakub says: "If there's a full record queued at the time
when [tlshd] passes the socket back to the kernel, it's up to the
reader to read the already queued data out." So SunRPC cannot
expect a data_ready call when ingress data is already waiting.

Add an explicit poll after SunRPC's upper transport is set up to
pick up any data that arrived after the TLS handshake but before
transport set-up is complete.
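
[Editor's note] The general shape of the fix is the classic
check-after-subscribe step for event-driven I/O: once a readiness
callback is installed, you must still poll once for events that fired
before installation. A hedged sketch; the helper names are placeholders,
not kernel APIs:

    install_data_ready_callback(sock, rpc_data_ready);

    /* a record may have been queued before the callback existed;
     * nothing will ever signal it again, so look once ourselves  */
    if (socket_has_ingress_data(sock))
            rpc_data_ready(sock);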

Reported-by: Steve Sears <sjs@hammerspace.com>
Suggested-by: Jakub Kicinski <kuba@kernel.org>
Fixes: 75eb6af7acdf ("SUNRPC: Add a TCP-with-TLS RPC transport class")
Tested-by: Mike Snitzer <snitzer@kernel.org>
Reviewed-by: Mike Snitzer <snitzer@kernel.org>
Cc: stable@vger.kernel.org
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
Signed-off-by: Anna Schumaker <anna.schumaker@oracle.com>
---
net/sunrpc/xprtsock.c | 5 +++++
1 file changed, 5 insertions(+)

--- a/net/sunrpc/xprtsock.c
+++ b/net/sunrpc/xprtsock.c
@@ -2740,6 +2740,11 @@ static void xs_tcp_tls_setup_socket(stru
}
rpc_shutdown_client(lower_clnt);

+ /* Check for ingress data that arrived before the socket's
+ * ->data_ready callback was set up.
+ */
+ xs_poll_check_readable(upper_transport);
+
out_unlock:
current_restore_flags(pflags, PF_MEMALLOC);
upper_transport->clnt = NULL;
@@ -1,89 +0,0 @@
From ac0c5ac5efecec7f731a1d80ec40ef3d34adc5ee Mon Sep 17 00:00:00 2001
From: Saurabh Sengar <ssengar@linux.microsoft.com>
Date: Thu, 29 May 2025 03:18:30 -0700
Subject: hv_netvsc: fix potential deadlock in netvsc_vf_setxdp()

The MANA driver's probe registers the netdevice via the following call chain:

mana_probe()
register_netdev()
register_netdevice()

register_netdevice() calls the notifier callback for the netvsc driver,
holding the netdev mutex via netdev_lock_ops().

Further, this netvsc notifier callback ends up attempting to acquire the
same lock again in dev_xdp_propagate(), leading to a deadlock.

netvsc_netdev_event()
netvsc_vf_setxdp()
dev_xdp_propagate()

This deadlock was not observed so far because net_shaper_ops was never set,
and thus the lock was effectively a no-op in this case. Fix this by using
netif_xdp_propagate() instead of dev_xdp_propagate() to avoid recursive
locking in this path.
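
[Editor's note] This is the common locked/unlocked API split: the outer
entry point takes the instance lock and delegates to a lockless variant
that callers already holding the lock can use directly. A sketch of the
assumed relationship (paraphrased, not a verbatim kernel excerpt):

    /* for callers that do NOT hold the instance lock */
    int dev_xdp_propagate(struct net_device *dev, struct netdev_bpf *bpf)
    {
            int ret;

            netdev_lock_ops(dev);
            ret = netif_xdp_propagate(dev, bpf); /* lock already held */
            netdev_unlock_ops(dev);
            return ret;
    }

The notifier path runs with the lock already held, so it must call the
netif_ variant.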

And, since no deadlock is observed on the other path, which is via
netvsc_probe, add the lock exclusively for that path.

Also, clean up the unregistration path by removing the unnecessary call to
netvsc_vf_setxdp(), since unregister_netdevice_many_notify() already
performs this cleanup via dev_xdp_uninstall().

Fixes: 97246d6d21c2 ("net: hold netdev instance lock during ndo_bpf")
Cc: stable@vger.kernel.org
Signed-off-by: Saurabh Sengar <ssengar@linux.microsoft.com>
Tested-by: Erni Sri Satya Vennela <ernis@linux.microsoft.com>
Reviewed-by: Haiyang Zhang <haiyangz@microsoft.com>
Reviewed-by: Subbaraya Sundeep <sbhatta@marvell.com>
Link: https://patch.msgid.link/1748513910-23963-1-git-send-email-ssengar@linux.microsoft.com
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
---
drivers/net/hyperv/netvsc_bpf.c | 2 +-
drivers/net/hyperv/netvsc_drv.c | 4 ++--
net/core/dev.c | 1 +
3 files changed, 4 insertions(+), 3 deletions(-)

--- a/drivers/net/hyperv/netvsc_bpf.c
+++ b/drivers/net/hyperv/netvsc_bpf.c
@@ -183,7 +183,7 @@ int netvsc_vf_setxdp(struct net_device *
xdp.command = XDP_SETUP_PROG;
xdp.prog = prog;

- ret = dev_xdp_propagate(vf_netdev, &xdp);
+ ret = netif_xdp_propagate(vf_netdev, &xdp);

if (ret && prog)
bpf_prog_put(prog);
--- a/drivers/net/hyperv/netvsc_drv.c
+++ b/drivers/net/hyperv/netvsc_drv.c
@@ -2462,8 +2462,6 @@ static int netvsc_unregister_vf(struct n

netdev_info(ndev, "VF unregistering: %s\n", vf_netdev->name);

- netvsc_vf_setxdp(vf_netdev, NULL);
-
reinit_completion(&net_device_ctx->vf_add);
netdev_rx_handler_unregister(vf_netdev);
netdev_upper_dev_unlink(vf_netdev, ndev);
@@ -2631,7 +2629,9 @@ static int netvsc_probe(struct hv_device
continue;

netvsc_prepare_bonding(vf_netdev);
+ netdev_lock_ops(vf_netdev);
netvsc_register_vf(vf_netdev, VF_REG_IN_PROBE);
+ netdev_unlock_ops(vf_netdev);
__netvsc_vf_setup(net, vf_netdev);
break;
}
--- a/net/core/dev.c
+++ b/net/core/dev.c
@@ -9863,6 +9863,7 @@ int netif_xdp_propagate(struct net_devic

return dev->netdev_ops->ndo_bpf(dev, bpf);
}
+EXPORT_SYMBOL_GPL(netif_xdp_propagate);

u32 dev_xdp_prog_id(struct net_device *dev, enum bpf_xdp_mode mode)
{
@@ -1,113 +0,0 @@
From 485c82a86fb97fb86cac303348c85b6cf71fd787 Mon Sep 17 00:00:00 2001
From: Jakub Kicinski <kuba@kernel.org>
Date: Mon, 9 Jun 2025 17:12:44 -0700
Subject: net: clear the dst when changing skb protocol
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

A not-so-careful NAT46 BPF program can crash the kernel
if it indiscriminately flips ingress packets from v4 to v6:

BUG: kernel NULL pointer dereference, address: 0000000000000000
ip6_rcv_core (net/ipv6/ip6_input.c:190:20)
ipv6_rcv (net/ipv6/ip6_input.c:306:8)
process_backlog (net/core/dev.c:6186:4)
napi_poll (net/core/dev.c:6906:9)
net_rx_action (net/core/dev.c:7028:13)
do_softirq (kernel/softirq.c:462:3)
netif_rx (net/core/dev.c:5326:3)
dev_loopback_xmit (net/core/dev.c:4015:2)
ip_mc_finish_output (net/ipv4/ip_output.c:363:8)
NF_HOOK (./include/linux/netfilter.h:314:9)
ip_mc_output (net/ipv4/ip_output.c:400:5)
dst_output (./include/net/dst.h:459:9)
ip_local_out (net/ipv4/ip_output.c:130:9)
ip_send_skb (net/ipv4/ip_output.c:1496:8)
udp_send_skb (net/ipv4/udp.c:1040:8)
udp_sendmsg (net/ipv4/udp.c:1328:10)

The output interface has a 4->6 program attached at ingress.
We try to loop the multicast skb back to the sending socket.
Ingress BPF runs as part of netif_rx(), pushes a valid v6 hdr
and changes skb->protocol to v6. We enter ip6_rcv_core which
tries to use skb_dst(). But the dst is still an IPv4 one left
after IPv4 mcast output.

Clear the dst in all BPF helpers which change the protocol.
Try to preserve metadata dsts, those may carry non-routing
metadata.

Cc: stable@vger.kernel.org
Reviewed-by: Maciej Żenczykowski <maze@google.com>
Acked-by: Daniel Borkmann <daniel@iogearbox.net>
Fixes: d219df60a70e ("bpf: Add ipip6 and ip6ip decap support for bpf_skb_adjust_room()")
Fixes: 1b00e0dfe7d0 ("bpf: update skb->protocol in bpf_skb_net_grow")
Fixes: 6578171a7ff0 ("bpf: add bpf_skb_change_proto helper")
Reviewed-by: Willem de Bruijn <willemb@google.com>
Link: https://patch.msgid.link/20250610001245.1981782-1-kuba@kernel.org
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
---
net/core/filter.c | 19 +++++++++++++------
1 file changed, 13 insertions(+), 6 deletions(-)

--- a/net/core/filter.c
+++ b/net/core/filter.c
@@ -3233,6 +3233,13 @@ static const struct bpf_func_proto bpf_s
.arg1_type = ARG_PTR_TO_CTX,
};

+static void bpf_skb_change_protocol(struct sk_buff *skb, u16 proto)
+{
+ skb->protocol = htons(proto);
+ if (skb_valid_dst(skb))
+ skb_dst_drop(skb);
+}
+
static int bpf_skb_generic_push(struct sk_buff *skb, u32 off, u32 len)
{
/* Caller already did skb_cow() with len as headroom,
@@ -3329,7 +3336,7 @@ static int bpf_skb_proto_4_to_6(struct s
}
}

- skb->protocol = htons(ETH_P_IPV6);
+ bpf_skb_change_protocol(skb, ETH_P_IPV6);
skb_clear_hash(skb);

return 0;
@@ -3359,7 +3366,7 @@ static int bpf_skb_proto_6_to_4(struct s
}
}

- skb->protocol = htons(ETH_P_IP);
+ bpf_skb_change_protocol(skb, ETH_P_IP);
skb_clear_hash(skb);

return 0;
@@ -3550,10 +3557,10 @@ static int bpf_skb_net_grow(struct sk_bu
/* Match skb->protocol to new outer l3 protocol */
if (skb->protocol == htons(ETH_P_IP) &&
flags & BPF_F_ADJ_ROOM_ENCAP_L3_IPV6)
- skb->protocol = htons(ETH_P_IPV6);
+ bpf_skb_change_protocol(skb, ETH_P_IPV6);
else if (skb->protocol == htons(ETH_P_IPV6) &&
flags & BPF_F_ADJ_ROOM_ENCAP_L3_IPV4)
- skb->protocol = htons(ETH_P_IP);
+ bpf_skb_change_protocol(skb, ETH_P_IP);
}

if (skb_is_gso(skb)) {
@@ -3606,10 +3613,10 @@ static int bpf_skb_net_shrink(struct sk_
/* Match skb->protocol to new outer l3 protocol */
if (skb->protocol == htons(ETH_P_IP) &&
flags & BPF_F_ADJ_ROOM_DECAP_L3_IPV6)
- skb->protocol = htons(ETH_P_IPV6);
+ bpf_skb_change_protocol(skb, ETH_P_IPV6);
else if (skb->protocol == htons(ETH_P_IPV6) &&
flags & BPF_F_ADJ_ROOM_DECAP_L3_IPV4)
- skb->protocol = htons(ETH_P_IP);
+ bpf_skb_change_protocol(skb, ETH_P_IP);

if (skb_is_gso(skb)) {
struct skb_shared_info *shinfo = skb_shinfo(skb);
@@ -1,67 +0,0 @@
From 2bf1f4a3adcecc53c1012e460d1412cece3747ce Mon Sep 17 00:00:00 2001
From: Eric Dumazet <edumazet@google.com>
Date: Wed, 11 Jun 2025 08:35:01 +0000
Subject: net_sched: sch_sfq: reject invalid perturb period

Gerrard Tai reported that SFQ perturb_period has no range check yet,
and this can be used to trigger a race condition fixed in a separate patch.

We want to make sure ctl->perturb_period * HZ will not overflow
and is positive.
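
[Editor's note] A worked example of the new bound, assuming HZ = 1000 (a
common configuration; other HZ values shift the limit):

    /* accepted iff 0 <= perturb_period <= INT_MAX / HZ */
    INT_MAX / HZ  =  2147483647 / 1000  =  2147483   /* seconds */

    /* 1000000000  > 2147483  -> rejected (matches the test below) */
    /*    2000000 <= 2147483  -> accepted                          */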

Tested:

tc qd add dev lo root sfq perturb -10 # negative value : error
Error: sch_sfq: invalid perturb period.

tc qd add dev lo root sfq perturb 1000000000 # too big : error
Error: sch_sfq: invalid perturb period.

tc qd add dev lo root sfq perturb 2000000 # acceptable value
tc -s -d qd sh dev lo
qdisc sfq 8005: root refcnt 2 limit 127p quantum 64Kb depth 127 flows 128 divisor 1024 perturb 2000000sec
Sent 0 bytes 0 pkt (dropped 0, overlimits 0 requeues 0)
backlog 0b 0p requeues 0

Fixes: 1da177e4c3f4 ("Linux-2.6.12-rc2")
Reported-by: Gerrard Tai <gerrard.tai@starlabs.sg>
Signed-off-by: Eric Dumazet <edumazet@google.com>
Cc: stable@vger.kernel.org
Link: https://patch.msgid.link/20250611083501.1810459-1-edumazet@google.com
Signed-off-by: Jakub Kicinski <kuba@kernel.org>
---
net/sched/sch_sfq.c | 10 ++++++++--
1 file changed, 8 insertions(+), 2 deletions(-)

--- a/net/sched/sch_sfq.c
+++ b/net/sched/sch_sfq.c
@@ -656,6 +656,14 @@ static int sfq_change(struct Qdisc *sch,
NL_SET_ERR_MSG_MOD(extack, "invalid quantum");
return -EINVAL;
}
+
+ if (ctl->perturb_period < 0 ||
+ ctl->perturb_period > INT_MAX / HZ) {
+ NL_SET_ERR_MSG_MOD(extack, "invalid perturb period");
+ return -EINVAL;
+ }
+ perturb_period = ctl->perturb_period * HZ;
+
if (ctl_v1 && !red_check_params(ctl_v1->qth_min, ctl_v1->qth_max,
ctl_v1->Wlog, ctl_v1->Scell_log, NULL))
return -EINVAL;
@@ -672,14 +680,12 @@ static int sfq_change(struct Qdisc *sch,
headdrop = q->headdrop;
maxdepth = q->maxdepth;
maxflows = q->maxflows;
- perturb_period = q->perturb_period;
quantum = q->quantum;
flags = q->flags;

/* update and validate configuration */
if (ctl->quantum)
quantum = ctl->quantum;
- perturb_period = ctl->perturb_period * HZ;
if (ctl->flows)
maxflows = min_t(u32, ctl->flows, SFQ_MAX_FLOWS);
if (ctl->divisor) {
@@ -1,93 +0,0 @@
From 90a5248443f925040b46e32fcf6715615c73e396 Mon Sep 17 00:00:00 2001
From: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Date: Fri, 6 Jun 2025 13:50:32 +0100
Subject: mm/vma: reset VMA iterator on commit_merge() OOM failure

While an OOM failure in commit_merge() isn't really feasible due to the
allocation which might fail (a maple tree pre-allocation) being 'too small
to fail', we do need to handle this case correctly regardless.

In vma_merge_existing_range(), we can theoretically encounter failures
which result in an OOM error in two ways - firstly, dup_anon_vma() might
fail with an OOM error, and secondly, commit_merge() might fail,
ultimately, to pre-allocate a maple tree node.

The abort logic for dup_anon_vma() resets the VMA iterator to the initial
range, ensuring that any logic looping on this iterator will correctly
proceed to the next VMA.

However, the commit_merge() abort logic does not do the same thing. This
resulted in a syzbot report occurring because mlockall() iterates through
VMAs, is tolerant of errors, but ended up with an incorrect previous VMA
being specified due to incorrect iterator state.

While making this change, it became apparent we are duplicating logic -
the logic introduced in commit 41e6ddcaa0f1 ("mm/vma: add give_up_on_oom
option on modify/merge, use in uffd release") duplicates the
vmg->give_up_on_oom check in both abort branches.

Additionally, we observe that we can perform the anon_dup check safely on
dup_anon_vma() failure, as this will not be modified should this call
fail.

Finally, we need to reset the iterator in both cases, so now we can simply
use the exact same code to abort for both.

We remove the VM_WARN_ON(err != -ENOMEM) as it would be silly for this to
be otherwise and it allows us to implement the abort check more neatly.

Link: https://lkml.kernel.org/r/20250606125032.164249-1-lorenzo.stoakes@oracle.com
Fixes: 47b16d0462a4 ("mm: abort vma_modify() on merge out of memory failure")
Signed-off-by: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Reported-by: syzbot+d16409ea9ecc16ed261a@syzkaller.appspotmail.com
Closes: https://lore.kernel.org/linux-mm/6842cc67.a00a0220.29ac89.003b.GAE@google.com/
Reviewed-by: Pedro Falcato <pfalcato@suse.de>
Reviewed-by: Vlastimil Babka <vbabka@suse.cz>
Reviewed-by: Liam R. Howlett <Liam.Howlett@oracle.com>
Cc: Jann Horn <jannh@google.com>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/vma.c | 22 ++++------------------
1 file changed, 4 insertions(+), 18 deletions(-)

--- a/mm/vma.c
+++ b/mm/vma.c
@@ -927,26 +927,9 @@ static __must_check struct vm_area_struc
err = dup_anon_vma(next, middle, &anon_dup);
}

- if (err)
+ if (err || commit_merge(vmg))
goto abort;

- err = commit_merge(vmg);
- if (err) {
- VM_WARN_ON(err != -ENOMEM);
-
- if (anon_dup)
- unlink_anon_vmas(anon_dup);
-
- /*
- * We've cleaned up any cloned anon_vma's, no VMAs have been
- * modified, no harm no foul if the user requests that we not
- * report this and just give up, leaving the VMAs unmerged.
- */
- if (!vmg->give_up_on_oom)
- vmg->state = VMA_MERGE_ERROR_NOMEM;
- return NULL;
- }
-
khugepaged_enter_vma(vmg->target, vmg->flags);
vmg->state = VMA_MERGE_SUCCESS;
return vmg->target;
@@ -955,6 +938,9 @@ abort:
vma_iter_set(vmg->vmi, start);
vma_iter_load(vmg->vmi);

+ if (anon_dup)
+ unlink_anon_vmas(anon_dup);
+
/*
* This means we have failed to clone anon_vma's correctly, but no
* actual changes to VMAs have occurred, so no harm no foul - if the
@@ -1,90 +0,0 @@
From 7c9d5350d8acfe1b876a8acabdf247b44a803d58 Mon Sep 17 00:00:00 2001
From: Ryan Roberts <ryan.roberts@arm.com>
Date: Fri, 6 Jun 2025 10:28:07 +0100
Subject: mm: close theoretical race where stale TLB entries could linger

Commit 3ea277194daa ("mm, mprotect: flush TLB if potentially racing with a
parallel reclaim leaving stale TLB entries") described a theoretical race
as such:

"""
Nadav Amit identified a theoretical race between page reclaim and mprotect
due to TLB flushes being batched outside of the PTL being held.

He described the race as follows:

CPU0                            CPU1
----                            ----
                                user accesses memory using RW PTE
                                [PTE now cached in TLB]
try_to_unmap_one()
==> ptep_get_and_clear()
==> set_tlb_ubc_flush_pending()
                                mprotect(addr, PROT_READ)
                                ==> change_pte_range()
                                ==> [ PTE non-present - no flush ]

                                user writes using cached RW PTE
...

try_to_unmap_flush()

The same type of race exists for reads when protecting for PROT_NONE and
also exists for operations that can leave an old TLB entry behind such as
munmap, mremap and madvise.
"""

The solution was to introduce flush_tlb_batched_pending() and call it
under the PTL from mprotect/madvise/munmap/mremap to complete any pending
tlb flushes.

However, while madvise_free_pte_range() and
madvise_cold_or_pageout_pte_range() were both retro-fitted to call
flush_tlb_batched_pending() immediately after initially acquiring the PTL,
they both temporarily release the PTL to split a large folio if they
stumble upon one. In this case, when re-acquiring the PTL,
flush_tlb_batched_pending() must be called again, but previously it was
not. Let's fix that.
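
[Editor's note] The fixed pattern, sketched and condensed from the two
hunks below; the split_folio() step stands in for the real folio-splitting
logic:

    start_pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
    flush_tlb_batched_pending(mm);      /* covers first acquisition  */
    ...
    pte_unmap_unlock(start_pte, ptl);   /* PTL dropped to split      */
    split_folio(folio);
    start_pte = pte_offset_map_lock(mm, pmd, addr, &ptl);
    flush_tlb_batched_pending(mm);      /* the fix: cover re-acquire */
    arch_enter_lazy_mmu_mode();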

There are 2 Fixes: tags here: the first is the commit that fixed
madvise_free_pte_range(). The second is the commit that added
madvise_cold_or_pageout_pte_range(), which looks like it copy/pasted the
faulty pattern from madvise_free_pte_range().

This is a theoretical bug discovered during code review.

Link: https://lkml.kernel.org/r/20250606092809.4194056-1-ryan.roberts@arm.com
Fixes: 3ea277194daa ("mm, mprotect: flush TLB if potentially racing with a parallel reclaim leaving stale TLB entries")
Fixes: 9c276cc65a58 ("mm: introduce MADV_COLD")
Signed-off-by: Ryan Roberts <ryan.roberts@arm.com>
Reviewed-by: Jann Horn <jannh@google.com>
Acked-by: David Hildenbrand <david@redhat.com>
Cc: Liam Howlett <liam.howlett@oracle.com>
Cc: Lorenzo Stoakes <lorenzo.stoakes@oracle.com>
Cc: Mel Gorman <mgorman@suse.de>
Cc: Vlastimil Babka <vbabka@suse.cz>
Cc: <stable@vger.kernel.org>
Signed-off-by: Andrew Morton <akpm@linux-foundation.org>
---
mm/madvise.c | 2 ++
1 file changed, 2 insertions(+)

--- a/mm/madvise.c
+++ b/mm/madvise.c
@@ -503,6 +503,7 @@ restart:
pte_offset_map_lock(mm, pmd, addr, &ptl);
if (!start_pte)
break;
+ flush_tlb_batched_pending(mm);
arch_enter_lazy_mmu_mode();
if (!err)
nr = 0;
@@ -736,6 +737,7 @@ static int madvise_free_pte_range(pmd_t
start_pte = pte;
if (!start_pte)
break;
+ flush_tlb_batched_pending(mm);
arch_enter_lazy_mmu_mode();
if (!err)
nr = 0;
@@ -1,33 +0,0 @@
From 862a81c79f0bea8ede0352b637b44716f02f71b9 Mon Sep 17 00:00:00 2001
From: Jens Axboe <axboe@kernel.dk>
Date: Fri, 13 Jun 2025 11:01:49 -0600
Subject: io_uring/kbuf: don't truncate end buffer for multiple buffer peeks

If peeking a bunch of buffers, normally io_ring_buffers_peek() will
truncate the end buffer. This isn't optimal as presumably more data will
be arriving later, and hence it's better to stop with the last full
buffer rather than truncate the end buffer.
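
[Editor's note] A small worked example of the new behaviour, with
illustrative numbers and assuming fixed-size buffers without IOBL_INC:

    /* max_len = 100, registered buffer size = 64 */
    before: iov[0].len = 64, iov[1].len = 36  /* 2nd buffer truncated */
    after:  iov[0].len = 64                   /* stop at last full one */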

Cc: stable@vger.kernel.org
Fixes: 35c8711c8fc4 ("io_uring/kbuf: add helpers for getting/peeking multiple buffers")
Reported-by: Christian Mazakas <christian.mazakas@gmail.com>
Signed-off-by: Jens Axboe <axboe@kernel.dk>
---
io_uring/kbuf.c | 5 ++++-
1 file changed, 4 insertions(+), 1 deletion(-)

--- a/io_uring/kbuf.c
+++ b/io_uring/kbuf.c
@@ -270,8 +270,11 @@ static int io_ring_buffers_peek(struct i
/* truncate end piece, if needed, for non partial buffers */
if (len > arg->max_len) {
len = arg->max_len;
- if (!(bl->flags & IOBL_INC))
+ if (!(bl->flags & IOBL_INC)) {
+ if (iov != arg->iovs)
+ break;
buf->len = len;
+ }
}

iov->iov_base = u64_to_user_ptr(buf->addr);
@@ -1,54 +0,0 @@
From bb3d761325a1707c8064a3d7dd556ed6a501a2e7 Mon Sep 17 00:00:00 2001
From: Jens Axboe <axboe@kernel.dk>
Date: Fri, 13 Jun 2025 13:37:41 -0600
Subject: nvme: always punt polled uring_cmd end_io work to task_work

Currently NVMe uring_cmd completions will complete locally, if they are
polled. This is done because those completions are always invoked from
task context. And while that is true, there's no guarantee that it's
invoked under the right ring context, or even task. If someone does
NVMe passthrough via multiple threads and with a limited number of
poll queues, then ringA may find completions from ringB. For that case,
completing the request may not be sound.

Always just punt the passthrough completions via task_work, which will
redirect the completion, if needed.

Cc: stable@vger.kernel.org
Fixes: 585079b6e425 ("nvme: wire up async polling for io passthrough commands")
Signed-off-by: Jens Axboe <axboe@kernel.dk>
---
drivers/nvme/host/ioctl.c | 21 +++++++--------------
1 file changed, 7 insertions(+), 14 deletions(-)

--- a/drivers/nvme/host/ioctl.c
+++ b/drivers/nvme/host/ioctl.c
@@ -429,21 +429,14 @@ static enum rq_end_io_ret nvme_uring_cmd
pdu->result = le64_to_cpu(nvme_req(req)->result.u64);

/*
- * For iopoll, complete it directly. Note that using the uring_cmd
- * helper for this is safe only because we check blk_rq_is_poll().
- * As that returns false if we're NOT on a polled queue, then it's
- * safe to use the polled completion helper.
- *
- * Otherwise, move the completion to task work.
+ * IOPOLL could potentially complete this request directly, but
+ * if multiple rings are polling on the same queue, then it's possible
+ * for one ring to find completions for another ring. Punting the
+ * completion via task_work will always direct it to the right
+ * location, rather than potentially complete requests for ringA
+ * under iopoll invocations from ringB.
*/
- if (blk_rq_is_poll(req)) {
- if (pdu->bio)
- blk_rq_unmap_user(pdu->bio);
- io_uring_cmd_iopoll_done(ioucmd, pdu->result, pdu->status);
- } else {
- io_uring_cmd_do_in_task_lazy(ioucmd, nvme_uring_task_cb);
- }
-
+ io_uring_cmd_do_in_task_lazy(ioucmd, nvme_uring_task_cb);
return RQ_END_IO_FREE;
}

@@ -1,33 +0,0 @@
From a57621608b2cbcbd0c7da184e9012b9b111a8577 Mon Sep 17 00:00:00 2001
From: Damien Le Moal <dlemoal@kernel.org>
Date: Wed, 11 Jun 2025 09:59:15 +0900
Subject: block: Clear BIO_EMULATES_ZONE_APPEND flag on BIO completion

When blk_zone_write_plug_bio_endio() is called for a regular write BIO
used to emulate a zone append operation, that is, a BIO flagged with
BIO_EMULATES_ZONE_APPEND, the BIO operation code is restored to the
original REQ_OP_ZONE_APPEND but the BIO_EMULATES_ZONE_APPEND flag is not
cleared. Clear it to fully return the BIO to its original definition.

Fixes: 9b1ce7f0c6f8 ("block: Implement zone append emulation")
Cc: stable@vger.kernel.org
Signed-off-by: Damien Le Moal <dlemoal@kernel.org>
Reviewed-by: Johannes Thumshirn <johannes.thumshirn@wdc.com>
Reviewed-by: Hannes Reinecke <hare@suse.de>
Reviewed-by: Christoph Hellwig <hch@lst.de>
Link: https://lore.kernel.org/r/20250611005915.89843-1-dlemoal@kernel.org
Signed-off-by: Jens Axboe <axboe@kernel.dk>
---
block/blk-zoned.c | 1 +
1 file changed, 1 insertion(+)

--- a/block/blk-zoned.c
+++ b/block/blk-zoned.c
@@ -1225,6 +1225,7 @@ void blk_zone_write_plug_bio_endio(struc
if (bio_flagged(bio, BIO_EMULATES_ZONE_APPEND)) {
bio->bi_opf &= ~REQ_OP_MASK;
bio->bi_opf |= REQ_OP_ZONE_APPEND;
+ bio_clear_flag(bio, BIO_EMULATES_ZONE_APPEND);
}

/*
@@ -1,65 +0,0 @@
From 7fc5a2cbcc8459cab6ae8c5dd1220768027ccb70 Mon Sep 17 00:00:00 2001
From: Jens Axboe <axboe@kernel.dk>
Date: Wed, 11 Jun 2025 08:48:46 -0600
Subject: block: use plug request list tail for one-shot backmerge attempt

Previously, the block layer stored the requests in the plug list in
LIFO order. For this reason, blk_attempt_plug_merge() would check
just the head entry for a back merge attempt, and abort after that
unless requests for multiple queues existed in the plug list. If more
than one request is present in the plug list, this makes the one-shot
back merging less useful than before, as it'll always fail to find a
quick merge candidate.

Use the tail entry for the one-shot merge attempt, which is the last
added request in the list. If that fails, abort immediately unless
there are multiple queues available. If multiple queues are available,
then scan the list. Ideally the latter scan would be a backwards scan
of the list, but as it currently stands, the plug list is singly linked
and hence this isn't easily feasible.
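
[Editor's note] A quick illustration with hypothetical request names: with
FIFO ordering, a plug list for queue q holds [a, b, c], c added last. Only
c can be extended by a back merge, but the old code probed a (the head)
and gave up. Probing the tail hits c directly (condensed from the diff
below):

    /* FIFO plug list: a -> b -> c   (c is the most recently added) */
    rq = plug->mq_list.tail;                 /* probe c, not a      */
    if (rq->q == q)
            return blk_attempt_bio_merge(q, rq, bio, nr_segs, false) ==
                   BIO_MERGE_OK;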

Cc: stable@vger.kernel.org
Link: https://lore.kernel.org/linux-block/20250611121626.7252-1-abuehaze@amazon.com/
Reported-by: Hazem Mohamed Abuelfotoh <abuehaze@amazon.com>
Fixes: e70c301faece ("block: don't reorder requests in blk_add_rq_to_plug")
Signed-off-by: Jens Axboe <axboe@kernel.dk>
---
block/blk-merge.c | 26 +++++++++++++-------------
1 file changed, 13 insertions(+), 13 deletions(-)

--- a/block/blk-merge.c
+++ b/block/blk-merge.c
@@ -1127,20 +1127,20 @@ bool blk_attempt_plug_merge(struct reque
if (!plug || rq_list_empty(&plug->mq_list))
return false;

- rq_list_for_each(&plug->mq_list, rq) {
- if (rq->q == q) {
- if (blk_attempt_bio_merge(q, rq, bio, nr_segs, false) ==
- BIO_MERGE_OK)
- return true;
- break;
- }
+ rq = plug->mq_list.tail;
+ if (rq->q == q)
+ return blk_attempt_bio_merge(q, rq, bio, nr_segs, false) ==
+ BIO_MERGE_OK;
+ else if (!plug->multiple_queues)
+ return false;

- /*
- * Only keep iterating plug list for merges if we have multiple
- * queues
- */
- if (!plug->multiple_queues)
- break;
+ rq_list_for_each(&plug->mq_list, rq) {
+ if (rq->q != q)
+ continue;
+ if (blk_attempt_bio_merge(q, rq, bio, nr_segs, false) ==
+ BIO_MERGE_OK)
+ return true;
+ break;
}
return false;
}
@@ -1,149 +0,0 @@
From 8ad4520fc849262ab23adbabebd366d4755035bc Mon Sep 17 00:00:00 2001
From: "Mike Rapoport (Microsoft)" <rppt@kernel.org>
Date: Tue, 3 Jun 2025 14:14:45 +0300
Subject: Revert "mm/execmem: Unify early execmem_cache behaviour"

The commit d6d1e3e6580c ("mm/execmem: Unify early execmem_cache
behaviour") changed early behaviour of the execmem ROX cache to allow its
usage in early x86 code that allocates text pages when
CONFIG_MITIGATION_ITS is enabled.

The permission management of the pages allocated from execmem for ITS
mitigation is now completely contained in arch/x86/kernel/alternatives.c
and therefore there is no need to special case early allocations in
execmem.

This reverts commit d6d1e3e6580ca35071ad474381f053cbf1fb6414.

Signed-off-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: stable@vger.kernel.org
Link: https://lkml.kernel.org/r/20250603111446.2609381-6-rppt@kernel.org
---
 arch/x86/mm/init_32.c   |  3 ---
 arch/x86/mm/init_64.c   |  3 ---
 include/linux/execmem.h |  8 +-------
 mm/execmem.c            | 40 +++-------------------------------------
 4 files changed, 4 insertions(+), 50 deletions(-)

--- a/arch/x86/mm/init_32.c
+++ b/arch/x86/mm/init_32.c
@@ -30,7 +30,6 @@
#include <linux/initrd.h>
#include <linux/cpumask.h>
#include <linux/gfp.h>
-#include <linux/execmem.h>

#include <asm/asm.h>
#include <asm/bios_ebda.h>
@@ -756,8 +755,6 @@ void mark_rodata_ro(void)
	pr_info("Write protecting kernel text and read-only data: %luk\n",
		size >> 10);

-	execmem_cache_make_ro();
-
	kernel_set_to_readonly = 1;

#ifdef CONFIG_CPA_DEBUG
--- a/arch/x86/mm/init_64.c
+++ b/arch/x86/mm/init_64.c
@@ -34,7 +34,6 @@
#include <linux/gfp.h>
#include <linux/kcore.h>
#include <linux/bootmem_info.h>
-#include <linux/execmem.h>

#include <asm/processor.h>
#include <asm/bios_ebda.h>
@@ -1392,8 +1391,6 @@ void mark_rodata_ro(void)
		(end - start) >> 10);
	set_memory_ro(start, (end - start) >> PAGE_SHIFT);

-	execmem_cache_make_ro();
-
	kernel_set_to_readonly = 1;

	/*
--- a/include/linux/execmem.h
+++ b/include/linux/execmem.h
@@ -54,7 +54,7 @@ enum execmem_range_flags {
	EXECMEM_ROX_CACHE	= (1 << 1),
};

-#if defined(CONFIG_ARCH_HAS_EXECMEM_ROX) && defined(CONFIG_EXECMEM)
+#ifdef CONFIG_ARCH_HAS_EXECMEM_ROX
/**
 * execmem_fill_trapping_insns - set memory to contain instructions that
 *                               will trap
@@ -94,15 +94,9 @@ int execmem_make_temp_rw(void *ptr, size
 * Return: 0 on success or negative error code on failure.
 */
int execmem_restore_rox(void *ptr, size_t size);
-
-/*
- * Called from mark_readonly(), where the system transitions to ROX.
- */
-void execmem_cache_make_ro(void);
#else
static inline int execmem_make_temp_rw(void *ptr, size_t size) { return 0; }
static inline int execmem_restore_rox(void *ptr, size_t size) { return 0; }
-static inline void execmem_cache_make_ro(void) { }
#endif

/**
--- a/mm/execmem.c
+++ b/mm/execmem.c
@@ -254,34 +254,6 @@ out_unlock:
	return ptr;
}

-static bool execmem_cache_rox = false;
-
-void execmem_cache_make_ro(void)
-{
-	struct maple_tree *free_areas = &execmem_cache.free_areas;
-	struct maple_tree *busy_areas = &execmem_cache.busy_areas;
-	MA_STATE(mas_free, free_areas, 0, ULONG_MAX);
-	MA_STATE(mas_busy, busy_areas, 0, ULONG_MAX);
-	struct mutex *mutex = &execmem_cache.mutex;
-	void *area;
-
-	execmem_cache_rox = true;
-
-	mutex_lock(mutex);
-
-	mas_for_each(&mas_free, area, ULONG_MAX) {
-		unsigned long pages = mas_range_len(&mas_free) >> PAGE_SHIFT;
-		set_memory_ro(mas_free.index, pages);
-	}
-
-	mas_for_each(&mas_busy, area, ULONG_MAX) {
-		unsigned long pages = mas_range_len(&mas_busy) >> PAGE_SHIFT;
-		set_memory_ro(mas_busy.index, pages);
-	}
-
-	mutex_unlock(mutex);
-}
-
static int execmem_cache_populate(struct execmem_range *range, size_t size)
{
	unsigned long vm_flags = VM_ALLOW_HUGE_VMAP;
@@ -302,15 +274,9 @@ static int execmem_cache_populate(struct
	/* fill memory with instructions that will trap */
	execmem_fill_trapping_insns(p, alloc_size, /* writable = */ true);

-	if (execmem_cache_rox) {
-		err = set_memory_rox((unsigned long)p, vm->nr_pages);
-		if (err)
-			goto err_free_mem;
-	} else {
-		err = set_memory_x((unsigned long)p, vm->nr_pages);
-		if (err)
-			goto err_free_mem;
-	}
+	err = set_memory_rox((unsigned long)p, vm->nr_pages);
+	if (err)
+		goto err_free_mem;

	err = execmem_cache_add(p, alloc_size);
	if (err)
@@ -1,63 +0,0 @@
From 85bfdd784bd61df94fd42daca141ed173f647e8c Mon Sep 17 00:00:00 2001
From: Kai Huang <kai.huang@intel.com>
Date: Sat, 7 Jun 2025 01:07:37 +1200
Subject: x86/virt/tdx: Avoid indirect calls to TDX assembly functions

Two 'static inline' TDX helper functions (sc_retry() and
sc_retry_prerr()) take function pointer arguments which refer to
assembly functions. Normally, the compiler inlines the TDX helper,
realizes that the function pointer targets are completely static --
thus can be resolved at compile time -- and generates direct call
instructions.

But, other times (like when CONFIG_CC_OPTIMIZE_FOR_SIZE=y), the
compiler declines to inline the helpers and will instead generate
indirect call instructions.

Indirect calls to assembly functions require special annotation (for
various Control Flow Integrity mechanisms). But TDX assembly
functions lack the special annotations and can only be called
directly.

Annotate both the helpers as '__always_inline' to prod the compiler
into maintaining the direct calls. There is no guarantee here, but
Peter has volunteered to report the compiler bug if this assumption
ever breaks[1].

Fixes: 1e66a7e27539 ("x86/virt/tdx: Handle SEAMCALL no entropy error in common code")
Fixes: df01f5ae07dd ("x86/virt/tdx: Add SEAMCALL error printing for module initialization")
Signed-off-by: Kai Huang <kai.huang@intel.com>
Signed-off-by: Dave Hansen <dave.hansen@linux.intel.com>
Cc: stable@vger.kernel.org
Link: https://lore.kernel.org/lkml/20250605145914.GW39944@noisy.programming.kicks-ass.net/ [1]
Link: https://lore.kernel.org/all/20250606130737.30713-1-kai.huang%40intel.com
---
 arch/x86/include/asm/tdx.h  | 2 +-
 arch/x86/virt/vmx/tdx/tdx.c | 5 +++--
 2 files changed, 4 insertions(+), 3 deletions(-)

--- a/arch/x86/include/asm/tdx.h
+++ b/arch/x86/include/asm/tdx.h
@@ -100,7 +100,7 @@ void tdx_init(void);

typedef u64 (*sc_func_t)(u64 fn, struct tdx_module_args *args);

-static inline u64 sc_retry(sc_func_t func, u64 fn,
+static __always_inline u64 sc_retry(sc_func_t func, u64 fn,
			   struct tdx_module_args *args)
{
	int retry = RDRAND_RETRY_LOOPS;
--- a/arch/x86/virt/vmx/tdx/tdx.c
+++ b/arch/x86/virt/vmx/tdx/tdx.c
@@ -69,8 +69,9 @@ static inline void seamcall_err_ret(u64
		args->r9, args->r10, args->r11);
}

-static inline int sc_retry_prerr(sc_func_t func, sc_err_func_t err_func,
-				 u64 fn, struct tdx_module_args *args)
+static __always_inline int sc_retry_prerr(sc_func_t func,
+					  sc_err_func_t err_func,
+					  u64 fn, struct tdx_module_args *args)
{
	u64 sret = sc_retry(func, fn, args);

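As an aside, the inlining effect this patch relies on is easy to see in a few lines of plain C. The following is a minimal user-space sketch (not the kernel code; all names here are illustrative): with the always_inline attribute, constant propagation resolves the function-pointer argument at compile time and the call site becomes a direct call instead of "call *reg".

/* Toy model: a wrapper taking a function pointer. If the wrapper is
 * inlined, the pointer is a compile-time constant and the compiler
 * emits a direct call; if not, an indirect call survives. */
typedef unsigned long long u64;

static u64 seamcall_stub(u64 fn) { return fn; } /* stands in for the asm function */

static inline __attribute__((always_inline))
u64 retry_wrapper(u64 (*func)(u64), u64 fn)
{
	return func(fn); /* resolves to seamcall_stub once inlined */
}

int main(void)
{
	return (int)retry_wrapper(seamcall_stub, 0);
}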
@@ -1,31 +0,0 @@
From a94cf5c6e7e31be9d4788916ce847adb15735d81 Mon Sep 17 00:00:00 2001
From: Juergen Gross <jgross@suse.com>
Date: Tue, 3 Jun 2025 14:14:41 +0300
Subject: x86/mm/pat: don't collapse pages without PSE set

Collapsing pages to a leaf PMD or PUD should be done only if
X86_FEATURE_PSE is available, which is not the case when running e.g.
as a Xen PV guest.

Fixes: 41d88484c71c ("x86/mm/pat: restore large ROX pages after fragmentation")
Signed-off-by: Juergen Gross <jgross@suse.com>
Signed-off-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: stable@vger.kernel.org
Link: https://lore.kernel.org/r/20250528123557.12847-3-jgross@suse.com
---
 arch/x86/mm/pat/set_memory.c | 3 +++
 1 file changed, 3 insertions(+)

--- a/arch/x86/mm/pat/set_memory.c
+++ b/arch/x86/mm/pat/set_memory.c
@@ -1257,6 +1257,9 @@ static int collapse_pmd_page(pmd_t *pmd,
	pgprot_t pgprot;
	int i = 0;

+	if (!cpu_feature_enabled(X86_FEATURE_PSE))
+		return 0;
+
	addr &= PMD_MASK;
	pte = pte_offset_kernel(pmd, addr);
	first = *pte;
@@ -1,34 +0,0 @@
From 8f28d595d167316469bb33b701e27b4b79c1aab1 Mon Sep 17 00:00:00 2001
From: "Mike Rapoport (Microsoft)" <rppt@kernel.org>
Date: Tue, 3 Jun 2025 14:14:42 +0300
Subject: x86/Kconfig: only enable ROX cache in execmem when STRICT_MODULE_RWX
 is set

Currently ROX cache in execmem is enabled regardless of
STRICT_MODULE_RWX setting. This breaks an assumption that module memory
is writable when STRICT_MODULE_RWX is disabled, for instance for kernel
debugging.

Only enable ROX cache in execmem when STRICT_MODULE_RWX is set to
restore the original behaviour of module text permissions.

Fixes: 64f6a4e10c05 ("x86: re-enable EXECMEM_ROX support")
Signed-off-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: stable@vger.kernel.org
Link: https://lkml.kernel.org/r/20250603111446.2609381-3-rppt@kernel.org
---
 arch/x86/Kconfig | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

--- a/arch/x86/Kconfig
+++ b/arch/x86/Kconfig
@@ -88,7 +88,7 @@ config X86
	select ARCH_HAS_DMA_OPS			if GART_IOMMU || XEN
	select ARCH_HAS_EARLY_DEBUG		if KGDB
	select ARCH_HAS_ELF_RANDOMIZE
-	select ARCH_HAS_EXECMEM_ROX		if X86_64
+	select ARCH_HAS_EXECMEM_ROX		if X86_64 && STRICT_MODULE_RWX
	select ARCH_HAS_FAST_MULTIPLIER
	select ARCH_HAS_FORTIFY_SOURCE
	select ARCH_HAS_GCOV_PROFILE_ALL
@@ -1,110 +0,0 @@
From 24fd2e3cef1b98f4417b8015ba24a8a4dcaae0c1 Mon Sep 17 00:00:00 2001
From: "Mike Rapoport (Microsoft)" <rppt@kernel.org>
Date: Tue, 3 Jun 2025 14:14:43 +0300
Subject: x86/its: move its_pages array to struct mod_arch_specific

The pages with ITS thunks allocated for modules are tracked by an
array in 'struct module'.

Since this is a very architecture-specific data structure, move it to
'struct mod_arch_specific'.

No functional changes.

Fixes: 872df34d7c51 ("x86/its: Use dynamic thunks for indirect branches")
Suggested-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Signed-off-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Cc: stable@vger.kernel.org
Link: https://lkml.kernel.org/r/20250603111446.2609381-4-rppt@kernel.org
---
 arch/x86/include/asm/module.h |  8 ++++++++
 arch/x86/kernel/alternative.c | 19 ++++++++++---------
 include/linux/module.h        |  5 -----
 3 files changed, 18 insertions(+), 14 deletions(-)

--- a/arch/x86/include/asm/module.h
+++ b/arch/x86/include/asm/module.h
@@ -5,12 +5,20 @@
#include <asm-generic/module.h>
#include <asm/orc_types.h>

+struct its_array {
+#ifdef CONFIG_MITIGATION_ITS
+	void **pages;
+	int num;
+#endif
+};
+
struct mod_arch_specific {
#ifdef CONFIG_UNWINDER_ORC
	unsigned int num_orcs;
	int *orc_unwind_ip;
	struct orc_entry *orc_unwind;
#endif
+	struct its_array its_pages;
};

#endif /* _ASM_X86_MODULE_H */
--- a/arch/x86/kernel/alternative.c
+++ b/arch/x86/kernel/alternative.c
@@ -195,8 +195,8 @@ void its_fini_mod(struct module *mod)
	its_page = NULL;
	mutex_unlock(&text_mutex);

-	for (int i = 0; i < mod->its_num_pages; i++) {
-		void *page = mod->its_page_array[i];
+	for (int i = 0; i < mod->arch.its_pages.num; i++) {
+		void *page = mod->arch.its_pages.pages[i];
		execmem_restore_rox(page, PAGE_SIZE);
	}
}
@@ -206,11 +206,11 @@ void its_free_mod(struct module *mod)
	if (!cpu_feature_enabled(X86_FEATURE_INDIRECT_THUNK_ITS))
		return;

-	for (int i = 0; i < mod->its_num_pages; i++) {
-		void *page = mod->its_page_array[i];
+	for (int i = 0; i < mod->arch.its_pages.num; i++) {
+		void *page = mod->arch.its_pages.pages[i];
		execmem_free(page);
	}
-	kfree(mod->its_page_array);
+	kfree(mod->arch.its_pages.pages);
}
#endif /* CONFIG_MODULES */

@@ -223,14 +223,15 @@ static void *its_alloc(void)

#ifdef CONFIG_MODULES
	if (its_mod) {
-		void *tmp = krealloc(its_mod->its_page_array,
-				     (its_mod->its_num_pages+1) * sizeof(void *),
+		struct its_array *pages = &its_mod->arch.its_pages;
+		void *tmp = krealloc(pages->pages,
+				     (pages->num+1) * sizeof(void *),
				     GFP_KERNEL);
		if (!tmp)
			return NULL;

-		its_mod->its_page_array = tmp;
-		its_mod->its_page_array[its_mod->its_num_pages++] = page;
+		pages->pages = tmp;
+		pages->pages[pages->num++] = page;

		execmem_make_temp_rw(page, PAGE_SIZE);
	}
--- a/include/linux/module.h
+++ b/include/linux/module.h
@@ -586,11 +586,6 @@ struct module {
	atomic_t refcnt;
#endif

-#ifdef CONFIG_MITIGATION_ITS
-	int its_num_pages;
-	void **its_page_array;
-#endif
-
#ifdef CONFIG_CONSTRUCTORS
	/* Constructor functions. */
	ctor_fn_t *ctors;
@@ -1,148 +0,0 @@
From 48d82c4dd03de376a6f673bda0f4f2b97138d855 Mon Sep 17 00:00:00 2001
From: "Peter Zijlstra (Intel)" <peterz@infradead.org>
Date: Tue, 3 Jun 2025 14:14:44 +0300
Subject: x86/its: explicitly manage permissions for ITS pages

execmem_alloc() sets permissions differently depending on the kernel
configuration, CPU support for PSE and whether a page is allocated
before or after mark_rodata_ro().

Add tracking for pages allocated for ITS when patching the core kernel
and make sure the permissions for ITS pages are explicitly managed for
both kernel and module allocations.

Fixes: 872df34d7c51 ("x86/its: Use dynamic thunks for indirect branches")
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Co-developed-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Mike Rapoport (Microsoft) <rppt@kernel.org>
Signed-off-by: Peter Zijlstra (Intel) <peterz@infradead.org>
Reviewed-by: Nikolay Borisov <nik.borisov@suse.com>
Cc: stable@vger.kernel.org
Link: https://lkml.kernel.org/r/20250603111446.2609381-5-rppt@kernel.org
---
 arch/x86/kernel/alternative.c | 74 ++++++++++++++++++++++++-----------
 1 file changed, 52 insertions(+), 22 deletions(-)

--- a/arch/x86/kernel/alternative.c
+++ b/arch/x86/kernel/alternative.c
@@ -138,6 +138,24 @@ static struct module *its_mod;
#endif
static void *its_page;
static unsigned int its_offset;
+struct its_array its_pages;
+
+static void *__its_alloc(struct its_array *pages)
+{
+	void *page __free(execmem) = execmem_alloc(EXECMEM_MODULE_TEXT, PAGE_SIZE);
+	if (!page)
+		return NULL;
+
+	void *tmp = krealloc(pages->pages, (pages->num+1) * sizeof(void *),
+			     GFP_KERNEL);
+	if (!tmp)
+		return NULL;
+
+	pages->pages = tmp;
+	pages->pages[pages->num++] = page;
+
+	return no_free_ptr(page);
+}

/* Initialize a thunk with the "jmp *reg; int3" instructions. */
static void *its_init_thunk(void *thunk, int reg)
@@ -173,6 +191,21 @@ static void *its_init_thunk(void *thunk,
	return thunk + offset;
}

+static void its_pages_protect(struct its_array *pages)
+{
+	for (int i = 0; i < pages->num; i++) {
+		void *page = pages->pages[i];
+		execmem_restore_rox(page, PAGE_SIZE);
+	}
+}
+
+static void its_fini_core(void)
+{
+	if (IS_ENABLED(CONFIG_STRICT_KERNEL_RWX))
+		its_pages_protect(&its_pages);
+	kfree(its_pages.pages);
+}
+
#ifdef CONFIG_MODULES
void its_init_mod(struct module *mod)
{
@@ -195,10 +228,8 @@ void its_fini_mod(struct module *mod)
	its_page = NULL;
	mutex_unlock(&text_mutex);

-	for (int i = 0; i < mod->arch.its_pages.num; i++) {
-		void *page = mod->arch.its_pages.pages[i];
-		execmem_restore_rox(page, PAGE_SIZE);
-	}
+	if (IS_ENABLED(CONFIG_STRICT_MODULE_RWX))
+		its_pages_protect(&mod->arch.its_pages);
}

void its_free_mod(struct module *mod)
@@ -216,28 +247,23 @@ void its_free_mod(struct module *mod)

static void *its_alloc(void)
{
-	void *page __free(execmem) = execmem_alloc(EXECMEM_MODULE_TEXT, PAGE_SIZE);
+	struct its_array *pages = &its_pages;
+	void *page;

+#ifdef CONFIG_MODULE
+	if (its_mod)
+		pages = &its_mod->arch.its_pages;
+#endif
+
+	page = __its_alloc(pages);
	if (!page)
		return NULL;

-#ifdef CONFIG_MODULES
-	if (its_mod) {
-		struct its_array *pages = &its_mod->arch.its_pages;
-		void *tmp = krealloc(pages->pages,
-				     (pages->num+1) * sizeof(void *),
-				     GFP_KERNEL);
-		if (!tmp)
-			return NULL;
-
-		pages->pages = tmp;
-		pages->pages[pages->num++] = page;
+	execmem_make_temp_rw(page, PAGE_SIZE);
+	if (pages == &its_pages)
+		set_memory_x((unsigned long)page, 1);

-		execmem_make_temp_rw(page, PAGE_SIZE);
-	}
-#endif /* CONFIG_MODULES */
-
-	return no_free_ptr(page);
+	return page;
}

static void *its_allocate_thunk(int reg)
@@ -291,7 +317,9 @@ u8 *its_static_thunk(int reg)
	return thunk;
}

-#endif
+#else
+static inline void its_fini_core(void) {}
+#endif /* CONFIG_MITIGATION_ITS */

/*
 * Nomenclature for variable names to simplify and clarify this code and ease
@@ -2368,6 +2396,8 @@ void __init alternative_instructions(voi
	apply_retpolines(__retpoline_sites, __retpoline_sites_end);
	apply_returns(__return_sites, __return_sites_end);

+	its_fini_core();
+
	/*
	 * Adjust all CALL instructions to point to func()-10, including
	 * those in .altinstr_replacement.
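The bookkeeping that __its_alloc() factors out above is a common kernel idiom: grow a flat pointer array on each allocation so a later pass can walk pages[0..num) to re-protect or free everything. A standalone user-space sketch of just that pattern (illustrative names, malloc/realloc standing in for execmem_alloc()/krealloc()):

#include <stdlib.h>

struct page_array {
	void **pages;
	int num;
};

static void *track_alloc(struct page_array *arr, size_t size)
{
	void *page = malloc(size);        /* stands in for execmem_alloc() */
	if (!page)
		return NULL;

	void **tmp = realloc(arr->pages, (arr->num + 1) * sizeof(void *));
	if (!tmp) {
		free(page);               /* the kernel code relies on __free(execmem) here */
		return NULL;
	}
	arr->pages = tmp;
	arr->pages[arr->num++] = page;    /* recorded for the later protect/free pass */
	return page;
}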
@@ -1,32 +0,0 @@
From 9bed8caa4c73f2d524d9600c74e6cbcff71c2456 Mon Sep 17 00:00:00 2001
From: Yosry Ahmed <yosry.ahmed@linux.dev>
Date: Tue, 29 Apr 2025 08:32:15 -0700
Subject: KVM: SVM: Clear current_vmcb during vCPU free for all *possible* CPUs

When freeing a vCPU and thus its VMCB, clear current_vmcb for all possible
CPUs, not just online CPUs, as it's theoretically possible a CPU could go
offline and come back online in conjunction with KVM reusing the page for
a new VMCB.

Link: https://lore.kernel.org/all/20250320013759.3965869-1-yosry.ahmed@linux.dev
Fixes: fd65d3142f73 ("kvm: svm: Ensure an IBPB on all affected CPUs when freeing a vmcb")
Cc: stable@vger.kernel.org
Cc: Jim Mattson <jmattson@google.com>
Signed-off-by: Yosry Ahmed <yosry.ahmed@linux.dev>
[sean: split to separate patch, write changelog]
Signed-off-by: Sean Christopherson <seanjc@google.com>
---
 arch/x86/kvm/svm/svm.c | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

--- a/arch/x86/kvm/svm/svm.c
+++ b/arch/x86/kvm/svm/svm.c
@@ -1488,7 +1488,7 @@ static void svm_clear_current_vmcb(struc
{
	int i;

-	for_each_online_cpu(i)
+	for_each_possible_cpu(i)
		cmpxchg(per_cpu_ptr(&svm_data.current_vmcb, i), vmcb, NULL);
}

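The online-vs-possible distinction is the whole fix: a CPU that is offline during the sweep can come back online still caching the stale pointer. A user-space analogue of the corrected sweep (a toy model, not the KVM code; a plain array stands in for per-CPU data and a plain compare-and-clear for cmpxchg()):

#include <stddef.h>

#define NR_POSSIBLE_CPUS 8

static void *current_vmcb[NR_POSSIBLE_CPUS]; /* one slot per *possible* CPU */

static void clear_current_vmcb(void *vmcb)
{
	/* sweep every slot that could ever exist, not just online ones */
	for (int i = 0; i < NR_POSSIBLE_CPUS; i++) {
		if (current_vmcb[i] == vmcb)
			current_vmcb[i] = NULL;
	}
}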
@@ -1,43 +0,0 @@
From d74cb6c8b70d9b5ad8482f4821679b83bad9de63 Mon Sep 17 00:00:00 2001
From: Chao Gao <chao.gao@intel.com>
Date: Mon, 24 Mar 2025 22:08:48 +0800
Subject: KVM: VMX: Flush shadow VMCS on emergency reboot

Ensure the shadow VMCS cache is evicted during an emergency reboot to
prevent potential memory corruption if the cache is evicted after reboot.

This issue was identified through code inspection, as __loaded_vmcs_clear()
flushes both the normal VMCS and the shadow VMCS.

Avoid checking the "launched" state during an emergency reboot, unlike the
behavior in __loaded_vmcs_clear(). This is important because reboot NMIs
can interfere with operations like copy_shadow_to_vmcs12(), where shadow
VMCSes are loaded directly using VMPTRLD. In such cases, if NMIs occur
right after the VMCS load, the shadow VMCSes will be active but the
"launched" state may not be set.

Fixes: 16f5b9034b69 ("KVM: nVMX: Copy processor-specific shadow-vmcs to VMCS12")
Cc: stable@vger.kernel.org
Signed-off-by: Chao Gao <chao.gao@intel.com>
Reviewed-by: Kai Huang <kai.huang@intel.com>
Link: https://lore.kernel.org/r/20250324140849.2099723-1-chao.gao@intel.com
Signed-off-by: Sean Christopherson <seanjc@google.com>
---
 arch/x86/kvm/vmx/vmx.c | 5 ++++-
 1 file changed, 4 insertions(+), 1 deletion(-)

--- a/arch/x86/kvm/vmx/vmx.c
+++ b/arch/x86/kvm/vmx/vmx.c
@@ -769,8 +769,11 @@ void vmx_emergency_disable_virtualizatio
		return;

	list_for_each_entry(v, &per_cpu(loaded_vmcss_on_cpu, cpu),
-			    loaded_vmcss_on_cpu_link)
+			    loaded_vmcss_on_cpu_link) {
		vmcs_clear(v->vmcs);
+		if (v->shadow_vmcs)
+			vmcs_clear(v->shadow_vmcs);
+	}

	kvm_cpu_vmxoff();
}
@@ -1,64 +0,0 @@
From 6e492900893c011cbe13fbb881cf1e11df08982b Mon Sep 17 00:00:00 2001
From: Chen Ridong <chenridong@huawei.com>
Date: Wed, 18 Jun 2025 07:32:17 +0000
Subject: cgroup,freezer: fix incomplete freezing when attaching tasks
MIME-Version: 1.0
Content-Type: text/plain; charset=UTF-8
Content-Transfer-Encoding: 8bit

An issue was found:

  # cd /sys/fs/cgroup/freezer/
  # mkdir test
  # echo FROZEN > test/freezer.state
  # cat test/freezer.state
  FROZEN
  # sleep 1000 &
  [1] 863
  # echo 863 > test/cgroup.procs
  # cat test/freezer.state
  FREEZING

When tasks are migrated to a frozen cgroup, the freezer fails to
immediately freeze the tasks, causing the cgroup to remain in the
"FREEZING" state.

The freeze_task() function is called before clearing the CGROUP_FROZEN
flag. This causes the freezing() check to incorrectly return false,
preventing __freeze_task() from being invoked for the migrated task.

To fix this issue, clear the CGROUP_FROZEN state before calling
freeze_task().

Fixes: f5d39b020809 ("freezer,sched: Rewrite core freezer logic")
Cc: stable@vger.kernel.org # v6.1+
Reported-by: Zhong Jiawei <zhongjiawei1@huawei.com>
Signed-off-by: Chen Ridong <chenridong@huawei.com>
Acked-by: Michal Koutný <mkoutny@suse.com>
Signed-off-by: Tejun Heo <tj@kernel.org>
---
 kernel/cgroup/legacy_freezer.c | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/kernel/cgroup/legacy_freezer.c b/kernel/cgroup/legacy_freezer.c
index 039d1eb2f215..507b8f19a262 100644
--- a/kernel/cgroup/legacy_freezer.c
+++ b/kernel/cgroup/legacy_freezer.c
@@ -188,13 +188,12 @@ static void freezer_attach(struct cgroup_taskset *tset)
		if (!(freezer->state & CGROUP_FREEZING)) {
			__thaw_task(task);
		} else {
-			freeze_task(task);
-
			/* clear FROZEN and propagate upwards */
			while (freezer && (freezer->state & CGROUP_FROZEN)) {
				freezer->state &= ~CGROUP_FROZEN;
				freezer = parent_freezer(freezer);
			}
+			freeze_task(task);
		}
}

--
2.50.0

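The ordering bug described above can be modeled in a few lines of plain C. This is a toy sketch of the behavior the changelog describes (not the kernel's freezer internals): freeze_task() is a no-op while the FROZEN flag is still set, so the flag must be cleared first.

#include <stdbool.h>

#define CGROUP_FREEZING 0x1
#define CGROUP_FROZEN   0x2

/* per the changelog: freezing() is false while FROZEN is still set */
static bool freezing(int state)
{
	return (state & CGROUP_FREEZING) && !(state & CGROUP_FROZEN);
}

static bool freeze_task(int *cgroup_state)
{
	if (!freezing(*cgroup_state))
		return false;           /* the migrated task is silently skipped */
	/* ... would actually freeze the task here ... */
	return true;
}

static void attach_fixed(int *state)
{
	*state &= ~CGROUP_FROZEN;       /* clear FROZEN first ... */
	freeze_task(state);             /* ... so this call now takes effect */
}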
@@ -1,39 +0,0 @@
From ef4d2ebb50f1bd0d5b2e3f1aa2280d7d31e4a3c9 Mon Sep 17 00:00:00 2001
From: Maninder Singh <maninder1.s@samsung.com>
Date: Thu, 6 Mar 2025 14:50:06 +0530
Subject: NFSD: unregister filesystem in case genl_register_family() fails

With rpc_status netlink support, the matching unregister of
register_filesystem() was missed in case genl_register_family() fails.

Correct it by adding a new label.

Fixes: bd9d6a3efa97 ("NFSD: add rpc_status netlink support")
Cc: stable@vger.kernel.org
Signed-off-by: Maninder Singh <maninder1.s@samsung.com>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/nfsctl.c | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

--- a/fs/nfsd/nfsctl.c
+++ b/fs/nfsd/nfsctl.c
@@ -2305,7 +2305,7 @@ static int __init init_nfsd(void)
		goto out_free_cld;
	retval = register_filesystem(&nfsd_fs_type);
	if (retval)
-		goto out_free_all;
+		goto out_free_nfsd4;
	retval = genl_register_family(&nfsd_nl_family);
	if (retval)
		goto out_free_all;
@@ -2313,6 +2313,8 @@ static int __init init_nfsd(void)

	return 0;
out_free_all:
+	unregister_filesystem(&nfsd_fs_type);
+out_free_nfsd4:
	nfsd4_destroy_laundry_wq();
out_free_cld:
	unregister_cld_notifier();
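The fix is an instance of the standard kernel error-unwind ladder: each successful registration gets its own label, and a failure at step N jumps to the label that undoes exactly steps 1..N-1 in reverse order. A self-contained sketch of the shape (function names here are illustrative, not the nfsd code):

#include <errno.h>

static int register_fs(void) { return 0; }
static void unregister_fs(void) { }
static int register_genl_family(void) { return -ENOMEM; } /* simulate failure */

int init_example(void)
{
	int err;

	err = register_fs();            /* step 1 */
	if (err)
		return err;
	err = register_genl_family();   /* step 2 */
	if (err)
		goto out_unregister_fs; /* undo step 1 only */
	return 0;

out_unregister_fs:
	unregister_fs();
	return err;
}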
@@ -1,162 +0,0 @@
From 6c2a6b3e27a3a02fd9f3f92458d4995014dfe69f Mon Sep 17 00:00:00 2001
From: Maninder Singh <maninder1.s@samsung.com>
Date: Thu, 6 Mar 2025 14:50:07 +0530
Subject: NFSD: fix race between nfsd registration and exports_proc

As of now nfsd calls create_proc_exports_entry() at the start of
init_nfsd and cleans up with remove_proc_entry() at the end of exit_nfsd.

This causes a kernel oops if there is a race between these two operations:
(i) exportfs -r
(ii) mount -t nfsd none /proc/fs/nfsd

For a 5.4 ARM64 kernel:

CPU 1:
el1_irq+0xbc/0x180
arch_counter_get_cntvct+0x14/0x18
running_clock+0xc/0x18
preempt_count_add+0x88/0x110
prep_new_page+0xb0/0x220
get_page_from_freelist+0x2d8/0x1778
__alloc_pages_nodemask+0x15c/0xef0
__vmalloc_node_range+0x28c/0x478
__vmalloc_node_flags_caller+0x8c/0xb0
kvmalloc_node+0x88/0xe0
nfsd_init_net+0x6c/0x108 [nfsd]
ops_init+0x44/0x170
register_pernet_operations+0x114/0x270
register_pernet_subsys+0x34/0x50
init_nfsd+0xa8/0x718 [nfsd]
do_one_initcall+0x54/0x2e0

CPU 2:
Unable to handle kernel NULL pointer dereference at virtual address 0000000000000010

PC is at : exports_net_open+0x50/0x68 [nfsd]

Call trace:
exports_net_open+0x50/0x68 [nfsd]
exports_proc_open+0x2c/0x38 [nfsd]
proc_reg_open+0xb8/0x198
do_dentry_open+0x1c4/0x418
vfs_open+0x38/0x48
path_openat+0x28c/0xf18
do_filp_open+0x70/0xe8
do_sys_open+0x154/0x248

Sometimes it crashes at exports_net_open() and sometimes cache_seq_next_rcu().

The same happens on the latest 6.14 kernel as well:

[    0.000000] Linux version 6.14.0-rc5-next-20250304-dirty
...
[  285.455918] Unable to handle kernel paging request at virtual address 00001f4800001f48
...
[  285.464902] pc : cache_seq_next_rcu+0x78/0xa4
...
[  285.469695] Call trace:
[  285.470083]  cache_seq_next_rcu+0x78/0xa4 (P)
[  285.470488]  seq_read+0xe0/0x11c
[  285.470675]  proc_reg_read+0x9c/0xf0
[  285.470874]  vfs_read+0xc4/0x2fc
[  285.471057]  ksys_read+0x6c/0xf4
[  285.471231]  __arm64_sys_read+0x1c/0x28
[  285.471428]  invoke_syscall+0x44/0x100
[  285.471633]  el0_svc_common.constprop.0+0x40/0xe0
[  285.471870]  do_el0_svc_compat+0x1c/0x34
[  285.472073]  el0_svc_compat+0x2c/0x80
[  285.472265]  el0t_32_sync_handler+0x90/0x140
[  285.472473]  el0t_32_sync+0x19c/0x1a0
[  285.472887] Code: f9400885 93407c23 937d7c27 11000421 (f86378a3)
[  285.473422] ---[ end trace 0000000000000000 ]---

It reproduces simply with the below script:

  while [ 1 ]
  do
  /exportfs -r
  done &

  while [ 1 ]
  do
  insmod /nfsd.ko
  mount -t nfsd none /proc/fs/nfsd
  umount /proc/fs/nfsd
  rmmod nfsd
  done &

So interfaces exported to user space shall be registered last and
cleaned up first.

With this change there is no kernel oops.

Co-developed-by: Shubham Rana <s9.rana@samsung.com>
Signed-off-by: Shubham Rana <s9.rana@samsung.com>
Signed-off-by: Maninder Singh <maninder1.s@samsung.com>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Cc: stable@vger.kernel.org
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/nfsctl.c | 17 ++++++++---------
 1 file changed, 8 insertions(+), 9 deletions(-)

--- a/fs/nfsd/nfsctl.c
+++ b/fs/nfsd/nfsctl.c
@@ -2291,12 +2291,9 @@ static int __init init_nfsd(void)
	if (retval)
		goto out_free_pnfs;
	nfsd_lockd_init();	/* lockd->nfsd callbacks */
-	retval = create_proc_exports_entry();
-	if (retval)
-		goto out_free_lockd;
	retval = register_pernet_subsys(&nfsd_net_ops);
	if (retval < 0)
-		goto out_free_exports;
+		goto out_free_lockd;
	retval = register_cld_notifier();
	if (retval)
		goto out_free_subsys;
@@ -2308,11 +2305,16 @@ static int __init init_nfsd(void)
		goto out_free_nfsd4;
	retval = genl_register_family(&nfsd_nl_family);
	if (retval)
+		goto out_free_filesystem;
+	retval = create_proc_exports_entry();
+	if (retval)
		goto out_free_all;
	nfsd_localio_ops_init();

	return 0;
out_free_all:
+	genl_unregister_family(&nfsd_nl_family);
+out_free_filesystem:
	unregister_filesystem(&nfsd_fs_type);
out_free_nfsd4:
	nfsd4_destroy_laundry_wq();
@@ -2320,9 +2322,6 @@ out_free_cld:
	unregister_cld_notifier();
out_free_subsys:
	unregister_pernet_subsys(&nfsd_net_ops);
-out_free_exports:
-	remove_proc_entry("fs/nfs/exports", NULL);
-	remove_proc_entry("fs/nfs", NULL);
out_free_lockd:
	nfsd_lockd_shutdown();
	nfsd_drc_slab_free();
@@ -2335,14 +2334,14 @@ out_free_slabs:

static void __exit exit_nfsd(void)
{
+	remove_proc_entry("fs/nfs/exports", NULL);
+	remove_proc_entry("fs/nfs", NULL);
	genl_unregister_family(&nfsd_nl_family);
	unregister_filesystem(&nfsd_fs_type);
	nfsd4_destroy_laundry_wq();
	unregister_cld_notifier();
	unregister_pernet_subsys(&nfsd_net_ops);
	nfsd_drc_slab_free();
	nfsd_lockd_shutdown();
	nfsd4_free_slabs();
	nfsd4_exit_pnfs();
@@ -1,35 +0,0 @@
From 0d4fc17cb5da09d14dbff91da7e28e50d3f54af2 Mon Sep 17 00:00:00 2001
From: Olga Kornievskaia <okorniev@redhat.com>
Date: Fri, 21 Mar 2025 20:13:04 -0400
Subject: nfsd: fix access checking for NLM under XPRTSEC policies

When an export policy with xprtsec policy is set with "tls"
and/or "mtls", but an NFS client is doing a v3 xprtsec=tls
mount, then NLM locking calls fail with an error because
there is currently no support for NLM with TLS.

Until such support is added, allow NLM calls under TLS-secured
policy.

Fixes: 4cc9b9f2bf4d ("nfsd: refine and rename NFSD_MAY_LOCK")
Cc: stable@vger.kernel.org
Signed-off-by: Olga Kornievskaia <okorniev@redhat.com>
Reviewed-by: NeilBrown <neil@brown.name>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/export.c | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

--- a/fs/nfsd/export.c
+++ b/fs/nfsd/export.c
@@ -1124,7 +1124,8 @@ __be32 check_nfsd_access(struct svc_expo
			test_bit(XPT_PEER_AUTH, &xprt->xpt_flags))
			goto ok;
	}
-	goto denied;
+	if (!may_bypass_gss)
+		goto denied;

ok:
	/* legacy gss-only clients are always OK: */
@@ -1,32 +0,0 @@
From 2fa924062a9494772cd997cb8b1ec572cfe6490f Mon Sep 17 00:00:00 2001
From: NeilBrown <neil@brown.name>
Date: Fri, 28 Mar 2025 11:05:59 +1100
Subject: nfsd: nfsd4_spo_must_allow() must check this is a v4 compound request

If the request being processed is not a v4 compound request, then
examining the cstate can have undefined results.

This patch adds a check that the rpc procedure being executed
(rq_procinfo) is the NFSPROC4_COMPOUND procedure.

Reported-by: Olga Kornievskaia <okorniev@redhat.com>
Cc: stable@vger.kernel.org
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: NeilBrown <neil@brown.name>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/nfs4proc.c | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

--- a/fs/nfsd/nfs4proc.c
+++ b/fs/nfsd/nfs4proc.c
@@ -3766,7 +3766,8 @@ bool nfsd4_spo_must_allow(struct svc_rqs
	struct nfs4_op_map *allow = &cstate->clp->cl_spo_must_allow;
	u32 opiter;

-	if (!cstate->minorversion)
+	if (rqstp->rq_procinfo != &nfsd_version4.vs_proc[NFSPROC4_COMPOUND] ||
+	    cstate->minorversion == 0)
		return false;

	if (cstate->spo_must_allowed)
@@ -1,47 +0,0 @@
From c860b8340bf921de66aa7871f40507dd5628926f Mon Sep 17 00:00:00 2001
From: Li Lingfeng <lilingfeng3@huawei.com>
Date: Mon, 14 Apr 2025 22:38:52 +0800
Subject: nfsd: Initialize ssc before laundromat_work to prevent NULL
 dereference

In nfs4_state_start_net(), laundromat_work may access nfsd_ssc through
nfs4_laundromat -> nfsd4_ssc_expire_umount. If nfsd_ssc isn't initialized,
this can cause a NULL pointer dereference.

Normally the delayed start of laundromat_work allows sufficient time for
nfsd_ssc initialization to complete. However, when the kernel waits too
long for userspace responses (e.g. in the nfs4_state_start_net ->
nfsd4_end_grace -> nfsd4_record_grace_done -> nfsd4_cld_grace_done ->
cld_pipe_upcall -> __cld_pipe_upcall -> wait_for_completion path), the
delayed work may start before nfsd_ssc initialization finishes.

Fix this by moving nfsd_ssc initialization before starting laundromat_work.

Fixes: f4e44b393389 ("NFSD: delay unmount source's export after inter-server copy completed.")
Cc: stable@vger.kernel.org
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Li Lingfeng <lilingfeng3@huawei.com>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/nfssvc.c | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

--- a/fs/nfsd/nfssvc.c
+++ b/fs/nfsd/nfssvc.c
@@ -396,13 +396,13 @@ static int nfsd_startup_net(struct net *
	if (ret)
		goto out_filecache;

+#ifdef CONFIG_NFSD_V4_2_INTER_SSC
+	nfsd4_ssc_init_umount_work(nn);
+#endif
	ret = nfs4_state_start_net(net);
	if (ret)
		goto out_reply_cache;

-#ifdef CONFIG_NFSD_V4_2_INTER_SSC
-	nfsd4_ssc_init_umount_work(nn);
-#endif
	nn->nfsd_net_up = true;
	return 0;

@@ -1,62 +0,0 @@
From 01089ae8fff5bcc6e9949d50d76b70f2a16abe89 Mon Sep 17 00:00:00 2001
From: Chuck Lever <chuck.lever@oracle.com>
Date: Wed, 7 May 2025 10:45:15 -0400
Subject: NFSD: Implement FATTR4_CLONE_BLKSIZE attribute

RFC 7862 states that if an NFS server implements a CLONE operation,
it MUST also implement FATTR4_CLONE_BLKSIZE. NFSD implements CLONE,
but does not implement FATTR4_CLONE_BLKSIZE.

Note that in Section 12.2, RFC 7862 claims that
FATTR4_CLONE_BLKSIZE is RECOMMENDED, not REQUIRED. Likely this is
because a minor version is not permitted to add a REQUIRED
attribute. Confusing.

We assume this attribute reports a block size as a count of bytes,
as RFC 7862 does not specify a unit.

Reported-by: Roland Mainz <roland.mainz@nrubsig.org>
Suggested-by: Christoph Hellwig <hch@infradead.org>
Reviewed-by: Roland Mainz <roland.mainz@nrubsig.org>
Cc: stable@vger.kernel.org # v6.7+
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Chuck Lever <chuck.lever@oracle.com>
---
 fs/nfsd/nfs4xdr.c | 19 ++++++++++++++++++-
 1 file changed, 18 insertions(+), 1 deletion(-)

--- a/fs/nfsd/nfs4xdr.c
+++ b/fs/nfsd/nfs4xdr.c
@@ -3391,6 +3391,23 @@ static __be32 nfsd4_encode_fattr4_suppat
	return nfsd4_encode_bitmap4(xdr, supp[0], supp[1], supp[2]);
}

+/*
+ * Copied from generic_remap_checks/generic_remap_file_range_prep.
+ *
+ * These generic functions use the file system's s_blocksize, but
+ * individual file systems aren't required to use
+ * generic_remap_file_range_prep. Until there is a mechanism for
+ * determining a particular file system's (or file's) clone block
+ * size, this is the best NFSD can do.
+ */
+static __be32 nfsd4_encode_fattr4_clone_blksize(struct xdr_stream *xdr,
+						const struct nfsd4_fattr_args *args)
+{
+	struct inode *inode = d_inode(args->dentry);
+
+	return nfsd4_encode_uint32_t(xdr, inode->i_sb->s_blocksize);
+}
+
#ifdef CONFIG_NFSD_V4_SECURITY_LABEL
static __be32 nfsd4_encode_fattr4_sec_label(struct xdr_stream *xdr,
					    const struct nfsd4_fattr_args *args)
@@ -3545,7 +3562,7 @@ static const nfsd4_enc_attr nfsd4_enc_fa
	[FATTR4_MODE_SET_MASKED]	= nfsd4_encode_fattr4__noop,
	[FATTR4_SUPPATTR_EXCLCREAT]	= nfsd4_encode_fattr4_suppattr_exclcreat,
	[FATTR4_FS_CHARSET_CAP]		= nfsd4_encode_fattr4__noop,
-	[FATTR4_CLONE_BLKSIZE]		= nfsd4_encode_fattr4__noop,
+	[FATTR4_CLONE_BLKSIZE]		= nfsd4_encode_fattr4_clone_blksize,
	[FATTR4_SPACE_FREED]		= nfsd4_encode_fattr4__noop,
	[FATTR4_CHANGE_ATTR_TYPE]	= nfsd4_encode_fattr4__noop,

@@ -1,65 +0,0 @@
From e0246422dfc08dec0fc3c96f3201bab6ceec6774 Mon Sep 17 00:00:00 2001
From: Max Kellermann <max.kellermann@ionos.com>
Date: Wed, 23 Apr 2025 15:22:50 +0200
Subject: fs/nfs/read: fix double-unlock bug in nfs_return_empty_folio()

Sometimes, when a file was read while it was being truncated by
another NFS client, the kernel could deadlock because folio_unlock()
was called twice, and the second call would XOR back the `PG_locked`
flag.

Most of the time (depending on the timing of the truncation), nobody
notices the problem because folio_unlock() gets called three times,
which flips `PG_locked` back off:

 1. vfs_read, nfs_read_folio, ... nfs_read_add_folio,
    nfs_return_empty_folio
 2. vfs_read, nfs_read_folio, ... netfs_read_collection,
    netfs_unlock_abandoned_read_pages
 3. vfs_read, ... nfs_do_read_folio, nfs_read_add_folio,
    nfs_return_empty_folio

The problem is that nfs_read_add_folio() is not supposed to unlock the
folio if fscache is enabled, and a nfs_netfs_folio_unlock() check is
missing in nfs_return_empty_folio().

Rarely this leads to a warning in netfs_read_collection():

 ------------[ cut here ]------------
 R=0000031c: folio 10 is not locked
 WARNING: CPU: 0 PID: 29 at fs/netfs/read_collect.c:133 netfs_read_collection+0x7c0/0xf00
 [...]
 Workqueue: events_unbound netfs_read_collection_worker
 RIP: 0010:netfs_read_collection+0x7c0/0xf00
 [...]
 Call Trace:
  <TASK>
  netfs_read_collection_worker+0x67/0x80
  process_one_work+0x12e/0x2c0
  worker_thread+0x295/0x3a0

Most of the time, however, processes just get stuck forever in
folio_wait_bit_common(), waiting for `PG_locked` to disappear, which
never happens because nobody is really holding the folio lock.

Fixes: 000dbe0bec05 ("NFS: Convert buffered read paths to use netfs when fscache is enabled")
Cc: stable@vger.kernel.org
Signed-off-by: Max Kellermann <max.kellermann@ionos.com>
Reviewed-by: Dave Wysochanski <dwysocha@redhat.com>
Signed-off-by: Anna Schumaker <anna.schumaker@oracle.com>
---
 fs/nfs/read.c | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

--- a/fs/nfs/read.c
+++ b/fs/nfs/read.c
@@ -56,7 +56,8 @@ static int nfs_return_empty_folio(struct
{
	folio_zero_segment(folio, 0, folio_size(folio));
	folio_mark_uptodate(folio);
-	folio_unlock(folio);
+	if (nfs_netfs_folio_unlock(folio))
+		folio_unlock(folio);
	return 0;
}

@@ -1,32 +0,0 @@
From d9f4762296075cc67d9974d093a87064075853e1 Mon Sep 17 00:00:00 2001
From: Scott Mayhew <smayhew@redhat.com>
Date: Wed, 30 Apr 2025 07:12:29 -0400
Subject: NFSv4: Don't check for OPEN feature support in v4.1

fattr4_open_arguments is a v4.2 recommended attribute, so we shouldn't
be sending it to v4.1 servers.

Fixes: cb78f9b7d0c0 ("nfs: fix the fetch of FATTR4_OPEN_ARGUMENTS")
Signed-off-by: Scott Mayhew <smayhew@redhat.com>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Reviewed-by: Benjamin Coddington <bcodding@redhat.com>
Cc: stable@vger.kernel.org # 6.11+
Signed-off-by: Anna Schumaker <anna.schumaker@oracle.com>
---
 fs/nfs/nfs4proc.c | 5 +++--
 1 file changed, 3 insertions(+), 2 deletions(-)

--- a/fs/nfs/nfs4proc.c
+++ b/fs/nfs/nfs4proc.c
@@ -3976,8 +3976,9 @@ static int _nfs4_server_capabilities(str
			     FATTR4_WORD0_CASE_INSENSITIVE |
			     FATTR4_WORD0_CASE_PRESERVING;
	if (minorversion)
-		bitmask[2] = FATTR4_WORD2_SUPPATTR_EXCLCREAT |
-			     FATTR4_WORD2_OPEN_ARGUMENTS;
+		bitmask[2] = FATTR4_WORD2_SUPPATTR_EXCLCREAT;
+	if (minorversion > 1)
+		bitmask[2] |= FATTR4_WORD2_OPEN_ARGUMENTS;

	status = nfs4_call_sync(server->client, server, &msg, &args.seq_args, &res.seq_res, 0);
	if (status == 0) {
@@ -1,96 +0,0 @@
From 7147868788966e9032cdeb0cf33bd1ae47785088 Mon Sep 17 00:00:00 2001
From: Mike Snitzer <snitzer@kernel.org>
Date: Tue, 13 May 2025 12:08:31 -0400
Subject: NFS: always probe for LOCALIO support asynchronously

It was reported that NFS client mounts of AWS Elastic File System
(EFS) volumes are slow; this is because the AWS firewall disallows
LOCALIO (because it doesn't consider the use of NFS_LOCALIO_PROGRAM
valid), see: https://bugzilla.redhat.com/show_bug.cgi?id=2335129

Switch to performing the LOCALIO probe asynchronously to address the
potential for the NFS LOCALIO protocol being disallowed and/or slowed
by the remote server's response.

While at it, fix nfs_local_probe_async() to always take/put a
reference on the nfs_client that is using the LOCALIO protocol.
Also, unexport the nfs_local_probe() symbol and make it private to
fs/nfs/localio.c

This change has the side-effect of initially issuing reads, writes and
commits over the wire via SUNRPC until the LOCALIO probe completes.

Suggested-by: Jeff Layton <jlayton@kernel.org> # to always probe async
Fixes: 76d4cb6345da ("nfs: probe for LOCALIO when v4 client reconnects to server")
Cc: stable@vger.kernel.org # 6.14+
Signed-off-by: Mike Snitzer <snitzer@kernel.org>
Reviewed-by: Jeff Layton <jlayton@kernel.org>
Signed-off-by: Anna Schumaker <anna.schumaker@oracle.com>
---
 fs/nfs/client.c                           | 2 +-
 fs/nfs/flexfilelayout/flexfilelayoutdev.c | 2 +-
 fs/nfs/internal.h                         | 1 -
 fs/nfs/localio.c                          | 6 ++++--
 4 files changed, 6 insertions(+), 5 deletions(-)

--- a/fs/nfs/client.c
+++ b/fs/nfs/client.c
@@ -439,7 +439,7 @@ struct nfs_client *nfs_get_client(const
	spin_unlock(&nn->nfs_client_lock);
	new = rpc_ops->init_client(new, cl_init);
	if (!IS_ERR(new))
-		nfs_local_probe(new);
+		nfs_local_probe_async(new);
	return new;
}

--- a/fs/nfs/flexfilelayout/flexfilelayoutdev.c
+++ b/fs/nfs/flexfilelayout/flexfilelayoutdev.c
@@ -400,7 +400,7 @@ nfs4_ff_layout_prepare_ds(struct pnfs_la
		 * keep ds_clp even if DS is local, so that if local IO cannot
		 * proceed somehow, we can fall back to NFS whenever we want.
		 */
-		nfs_local_probe(ds->ds_clp);
+		nfs_local_probe_async(ds->ds_clp);
		max_payload =
			nfs_block_size(rpc_max_payload(ds->ds_clp->cl_rpcclient),
				       NULL);
--- a/fs/nfs/internal.h
+++ b/fs/nfs/internal.h
@@ -455,7 +455,6 @@ extern int nfs_wait_bit_killable(struct

#if IS_ENABLED(CONFIG_NFS_LOCALIO)
/* localio.c */
-extern void nfs_local_probe(struct nfs_client *);
extern void nfs_local_probe_async(struct nfs_client *);
extern void nfs_local_probe_async_work(struct work_struct *);
extern struct nfsd_file *nfs_local_open_fh(struct nfs_client *,
--- a/fs/nfs/localio.c
+++ b/fs/nfs/localio.c
@@ -171,7 +171,7 @@ static bool nfs_server_uuid_is_local(str
 * - called after alloc_client and init_client (so cl_rpcclient exists)
 * - this function is idempotent, it can be called for old or new clients
 */
-void nfs_local_probe(struct nfs_client *clp)
+static void nfs_local_probe(struct nfs_client *clp)
{
	/* Disallow localio if disabled via sysfs or AUTH_SYS isn't used */
	if (!localio_enabled ||
@@ -191,14 +191,16 @@ void nfs_local_probe(struct nfs_client *
	nfs_localio_enable_client(clp);
	nfs_uuid_end(&clp->cl_uuid);
}
-EXPORT_SYMBOL_GPL(nfs_local_probe);

void nfs_local_probe_async_work(struct work_struct *work)
{
	struct nfs_client *clp =
		container_of(work, struct nfs_client, cl_local_probe_work);

+	if (!refcount_inc_not_zero(&clp->cl_count))
+		return;
	nfs_local_probe(clp);
+	nfs_put_client(clp);
}

void nfs_local_probe_async(struct nfs_client *clp)
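The refcount_inc_not_zero() guard added above encodes a general rule for asynchronous workers: only run against an object whose reference count you successfully elevated, because a zero count means teardown has already begun. A user-space analogue of the same pattern using C11 atomics (a sketch with illustrative names, not the NFS code):

#include <stdatomic.h>
#include <stdbool.h>

struct client { atomic_int count; };

/* fails once the last reference has been dropped */
static bool refcount_inc_not_zero(atomic_int *r)
{
	int old = atomic_load(r);
	while (old != 0)
		if (atomic_compare_exchange_weak(r, &old, old + 1))
			return true;
	return false;
}

static void put_client(struct client *clp) { atomic_fetch_sub(&clp->count, 1); }
static void probe(struct client *clp) { (void)clp; /* the actual work */ }

static void probe_work(struct client *clp)
{
	if (!refcount_inc_not_zero(&clp->count))
		return;           /* client is being torn down; back off */
	probe(clp);
	put_client(clp);          /* drop the reference the worker took */
}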
@@ -1,29 +0,0 @@
From 97831e31e43bb023d208b2344546a4e51e580dc6 Mon Sep 17 00:00:00 2001
From: Ruben Devos <devosruben6@gmail.com>
Date: Sun, 1 Jun 2025 19:18:55 +0200
Subject: smb: client: add NULL check in automount_fullpath

page is checked for null in __build_path_from_dentry_optional_prefix
when tcon->origin_fullpath is not set. However, the check is missing when
it is set.
Add a check to prevent a potential NULL pointer dereference.

Signed-off-by: Ruben Devos <devosruben6@gmail.com>
Cc: stable@vger.kernel.org
Signed-off-by: Steve French <stfrench@microsoft.com>
---
 fs/smb/client/namespace.c | 3 +++
 1 file changed, 3 insertions(+)

--- a/fs/smb/client/namespace.c
+++ b/fs/smb/client/namespace.c
@@ -146,6 +146,9 @@ static char *automount_fullpath(struct d
	}
	spin_unlock(&tcon->tc_lock);

+	if (unlikely(!page))
+		return ERR_PTR(-ENOMEM);
+
	s = dentry_path_raw(dentry, page, PATH_MAX);
	if (IS_ERR(s))
		return s;
@@ -1,39 +0,0 @@
From 0ca6d39b6d40b868eb6b4021f918de7a0f6a0f2e Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:13 +0530
Subject: cifs: reset connections for all channels when reconnect requested

cifs_reconnect can be called with a flag to mark the session as needing
reconnect too. When this is done, we expect the connections of all
channels to be reconnected too, which is not happening today.

Without doing this, we have seen bad things happen when primary and
secondary channels are connected to different servers (in case of cloud
services like Azure Files SMB).

This change would force all connections to reconnect as well, not just
the sessions and tcons.

Cc: <stable@vger.kernel.org>
Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Signed-off-by: Steve French <stfrench@microsoft.com>
---
 fs/smb/client/connect.c | 7 +++++++
 1 file changed, 7 insertions(+)

--- a/fs/smb/client/connect.c
+++ b/fs/smb/client/connect.c
@@ -377,6 +377,13 @@ static int __cifs_reconnect(struct TCP_S
	if (!cifs_tcp_ses_needs_reconnect(server, 1))
		return 0;

+	/*
+	 * if smb session has been marked for reconnect, also reconnect all
+	 * connections. This way, the other connections do not end up bad.
+	 */
+	if (mark_smb_session)
+		cifs_signal_cifsd_for_reconnect(server, mark_smb_session);
+
	cifs_mark_tcp_ses_conns_for_reconnect(server, mark_smb_session);

	cifs_abort_connection(server);
@@ -1,31 +0,0 @@
From d1f84c6baebc480106c9558dea4842ecb3059017 Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:14 +0530
Subject: cifs: update dstaddr whenever channel iface is updated

When the server interface info changes (more common in clustered
servers like Azure Files), the per-channel iface gets updated.
However, this did not update the corresponding dstaddr. As a result
these channels will still connect (or try connecting) to older addresses.

Fixes: b54034a73baf ("cifs: during reconnect, update interface if necessary")
Cc: <stable@vger.kernel.org>
Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Signed-off-by: Steve French <stfrench@microsoft.com>
---
 fs/smb/client/sess.c | 4 ++++
 1 file changed, 4 insertions(+)

--- a/fs/smb/client/sess.c
+++ b/fs/smb/client/sess.c
@@ -445,6 +445,10 @@ cifs_chan_update_iface(struct cifs_ses *

	ses->chans[chan_index].iface = iface;
	spin_unlock(&ses->chan_lock);
+
+	spin_lock(&server->srv_lock);
+	memcpy(&server->dstaddr, &iface->sockaddr, sizeof(server->dstaddr));
+	spin_unlock(&server->srv_lock);
}

static int
@@ -1,33 +0,0 @@
From 2bffd71a70fa4695f62712688a720393cc92032b Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:16 +0530
Subject: cifs: dns resolution is needed only for primary channel

When calling cifs_reconnect, before the connection to the
server is reestablished, the code today does a DNS resolution and
updates server->dstaddr.

However, this is not necessary for secondary channels. Secondary
channels use the interface list returned by the server to decide
which address to connect to. And that happens after tcon is reconnected
and server interfaces are requested.

Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Cc: stable@vger.kernel.org
Signed-off-by: Steve French <stfrench@microsoft.com>
---
 fs/smb/client/connect.c | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

--- a/fs/smb/client/connect.c
+++ b/fs/smb/client/connect.c
@@ -392,7 +392,8 @@ static int __cifs_reconnect(struct TCP_S
		try_to_freeze();
		cifs_server_lock(server);

-		if (!cifs_swn_set_server_dstaddr(server)) {
+		if (!cifs_swn_set_server_dstaddr(server) &&
+		    !SERVER_IS_CHAN(server)) {
			/* resolve the hostname again to make sure that IP address is up-to-date */
			rc = reconn_set_ipaddr_from_hostname(server);
			cifs_dbg(FYI, "%s: reconn_set_ipaddr_from_hostname: rc=%d\n", __func__, rc);
@@ -1,73 +0,0 @@
From 918f494c058028cee8bdff33a4aa613377da61f0 Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:12 +0530
Subject: cifs: deal with the channel loading lag while picking channels

Our current approach to select a channel for sending requests is this:
1. iterate all channels to find the min and max queue depth
2. if min and max are not the same, pick the channel with min depth
3. if min and max are same, round robin, as all channels are equally loaded

The problem with this approach is that there's a lag between selecting
a channel and sending the request (that increases the queue depth on the channel).
While these numbers will eventually catch up, there could be a skew in the
channel usage, depending on the application's I/O parallelism and the server's
speed of handling requests.

With sufficient parallelism, this lag can artificially increase the queue depth,
thereby impacting the performance negatively.

This change will change the step 1 above to start the iteration from the last
selected channel. This is to reduce the skew in channel usage even in the presence
of this lag.

Fixes: ea90708d3cf3 ("cifs: use the least loaded channel for sending requests")
Cc: <stable@vger.kernel.org>
Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Signed-off-by: Steve French <stfrench@microsoft.com>
---
 fs/smb/client/transport.c | 14 +++++++-------
 1 file changed, 7 insertions(+), 7 deletions(-)

--- a/fs/smb/client/transport.c
+++ b/fs/smb/client/transport.c
@@ -1018,14 +1018,16 @@ struct TCP_Server_Info *cifs_pick_channe
	uint index = 0;
	unsigned int min_in_flight = UINT_MAX, max_in_flight = 0;
	struct TCP_Server_Info *server = NULL;
-	int i;
+	int i, start, cur;

	if (!ses)
		return NULL;

	spin_lock(&ses->chan_lock);
+	start = atomic_inc_return(&ses->chan_seq);
	for (i = 0; i < ses->chan_count; i++) {
-		server = ses->chans[i].server;
+		cur = (start + i) % ses->chan_count;
+		server = ses->chans[cur].server;
		if (!server || server->terminate)
			continue;

@@ -1042,17 +1044,15 @@ struct TCP_Server_Info *cifs_pick_channe
		 */
		if (server->in_flight < min_in_flight) {
			min_in_flight = server->in_flight;
-			index = i;
+			index = cur;
		}
		if (server->in_flight > max_in_flight)
			max_in_flight = server->in_flight;
	}

	/* if all channels are equally loaded, fall back to round-robin */
-	if (min_in_flight == max_in_flight) {
-		index = (uint)atomic_inc_return(&ses->chan_seq);
-		index %= ses->chan_count;
-	}
+	if (min_in_flight == max_in_flight)
+		index = (uint)start % ses->chan_count;

	server = ses->chans[index].server;
	spin_unlock(&ses->chan_lock);
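The selection policy after this patch is easy to state in isolation: scan for the least-loaded channel, but start the scan at a rotating offset so that ties (and the lag between picking a channel and its in_flight counter catching up) do not keep steering work to channel 0. A standalone sketch of that policy (plain arrays standing in for the cifs structures and locking):

static unsigned int pick_channel(const unsigned int *in_flight,
				 unsigned int nchans, unsigned int *seq)
{
	unsigned int start = (*seq)++;           /* rotating starting point */
	unsigned int min = ~0u, max = 0, index = 0;

	for (unsigned int i = 0; i < nchans; i++) {
		unsigned int cur = (start + i) % nchans;

		if (in_flight[cur] < min) {      /* least-loaded wins ... */
			min = in_flight[cur];
			index = cur;
		}
		if (in_flight[cur] > max)
			max = in_flight[cur];
	}
	/* ... and equal load falls back to round-robin on the same counter */
	if (min == max)
		index = start % nchans;
	return index;
}

Because the scan itself starts at the rotating offset, two concurrent callers that observe identical queue depths resolve ties to different channels instead of both landing on the lowest index.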
@@ -1,82 +0,0 @@
From 2cc6528030c91406031698e047896faa99fc0092 Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:15 +0530
Subject: cifs: serialize other channels when query server interfaces is
pending

Today, during smb2_reconnect, session_mutex is released as soon as
the tcon is reconnected and is in a good state. However, when
multichannel is enabled, a query of server interfaces follows. We've
seen that this query can race with reconnects of other channels,
causing them to step on each other.

This change extends the hold of session_mutex until after the query of
server interfaces is complete. To avoid recursive smb2_reconnect
checks during the query ioctl, this change also introduces a session
flag for sessions where such a query is in progress.

Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Cc: stable@vger.kernel.org
Signed-off-by: Steve French <stfrench@microsoft.com>
---
fs/smb/client/cifsglob.h | 1 +
fs/smb/client/smb2pdu.c | 24 ++++++++++++++++++------
2 files changed, 19 insertions(+), 6 deletions(-)

--- a/fs/smb/client/cifsglob.h
+++ b/fs/smb/client/cifsglob.h
@@ -1084,6 +1084,7 @@ struct cifs_chan {
};

#define CIFS_SES_FLAG_SCALE_CHANNELS (0x1)
+#define CIFS_SES_FLAGS_PENDING_QUERY_INTERFACES (0x2)

/*
* Session structure. One of these for each uid session with a particular host
--- a/fs/smb/client/smb2pdu.c
+++ b/fs/smb/client/smb2pdu.c
@@ -411,14 +411,19 @@ skip_sess_setup:
if (!rc &&
(server->capabilities & SMB2_GLOBAL_CAP_MULTI_CHANNEL) &&
server->ops->query_server_interfaces) {
- mutex_unlock(&ses->session_mutex);
-
/*
- * query server network interfaces, in case they change
+ * query server network interfaces, in case they change.
+ * Also mark the session as pending this update while the query
+ * is in progress. This will be used to avoid calling
+ * smb2_reconnect recursively.
*/
+ ses->flags |= CIFS_SES_FLAGS_PENDING_QUERY_INTERFACES;
xid = get_xid();
rc = server->ops->query_server_interfaces(xid, tcon, false);
free_xid(xid);
+ ses->flags &= ~CIFS_SES_FLAGS_PENDING_QUERY_INTERFACES;
+
+ mutex_unlock(&ses->session_mutex);

if (rc == -EOPNOTSUPP && ses->chan_count > 1) {
/*
@@ -560,11 +565,18 @@ static int smb2_ioctl_req_init(u32 opcod
struct TCP_Server_Info *server,
void **request_buf, unsigned int *total_len)
{
- /* Skip reconnect only for FSCTL_VALIDATE_NEGOTIATE_INFO IOCTLs */
- if (opcode == FSCTL_VALIDATE_NEGOTIATE_INFO) {
+ /*
+ * Skip reconnect in one of the following cases:
+ * 1. For FSCTL_VALIDATE_NEGOTIATE_INFO IOCTLs
+ * 2. For FSCTL_QUERY_NETWORK_INTERFACE_INFO IOCTL when called from
+ * smb2_reconnect (indicated by CIFS_SES_FLAG_SCALE_CHANNELS ses flag)
+ */
+ if (opcode == FSCTL_VALIDATE_NEGOTIATE_INFO ||
+ (opcode == FSCTL_QUERY_NETWORK_INTERFACE_INFO &&
+ (tcon->ses->flags & CIFS_SES_FLAGS_PENDING_QUERY_INTERFACES)))
return __smb2_plain_req_init(SMB2_IOCTL, tcon, server,
request_buf, total_len);
- }
+
return smb2_plain_req_init(SMB2_IOCTL, tcon, server,
request_buf, total_len);
}
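
The patch above combines two ideas: keep session_mutex held across the interface query, and set a flag so the query ioctl path can tell it is running inside smb2_reconnect and must not reconnect again. A compact pthreads sketch of that pattern follows; struct session and query_interfaces are hypothetical stand-ins, not the cifs symbols.

#include <pthread.h>

#define PENDING_QUERY_INTERFACES 0x2UL

struct session {
	pthread_mutex_t mutex;
	unsigned long flags;
};

/* stands in for the FSCTL_QUERY_NETWORK_INTERFACE_INFO ioctl; its
 * request-init step checks the flag and skips reconnect when the
 * caller is already inside reconnect_and_query() */
static int query_interfaces(struct session *ses)
{
	return (ses->flags & PENDING_QUERY_INTERFACES) ? 0 : -1;
}

static int reconnect_and_query(struct session *ses)
{
	int rc;

	pthread_mutex_lock(&ses->mutex);
	/* ... tcon reconnect happens here ... */

	/* mark the query as in progress so the ioctl path knows it is
	 * being called from inside reconnect */
	ses->flags |= PENDING_QUERY_INTERFACES;
	rc = query_interfaces(ses);
	ses->flags &= ~PENDING_QUERY_INTERFACES;

	/* the mutex is dropped only after the query completes, so other
	 * channels cannot start their own reconnect mid-query */
	pthread_mutex_unlock(&ses->mutex);
	return rc;
}
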
@@ -1,64 +0,0 @@
From 48fd713e7c35aba7a4c3ed327977897909575e3e Mon Sep 17 00:00:00 2001
From: Shyam Prasad N <sprasad@microsoft.com>
Date: Mon, 2 Jun 2025 22:37:17 +0530
Subject: cifs: do not disable interface polling on failure

When a server has multichannel enabled, we keep polling the server
for interfaces periodically. However, when this query fails, we
disable the polling. This can be problematic as it takes away the
chance for the server to start advertising again.

This change reschedules the delayed work, even if the current call
failed. That way, multichannel sessions can recover.

Signed-off-by: Shyam Prasad N <sprasad@microsoft.com>
Cc: stable@vger.kernel.org
Signed-off-by: Steve French <stfrench@microsoft.com>
---
fs/smb/client/connect.c | 6 +-----
fs/smb/client/smb2pdu.c | 9 +++++----
2 files changed, 6 insertions(+), 9 deletions(-)

--- a/fs/smb/client/connect.c
+++ b/fs/smb/client/connect.c
@@ -116,13 +116,9 @@ static void smb2_query_server_interfaces
rc = server->ops->query_server_interfaces(xid, tcon, false);
free_xid(xid);

- if (rc) {
- if (rc == -EOPNOTSUPP)
- return;
-
+ if (rc)
cifs_dbg(FYI, "%s: failed to query server interfaces: %d\n",
__func__, rc);
- }

queue_delayed_work(cifsiod_wq, &tcon->query_interfaces,
(SMB_INTERFACE_POLL_INTERVAL * HZ));
--- a/fs/smb/client/smb2pdu.c
+++ b/fs/smb/client/smb2pdu.c
@@ -423,6 +423,10 @@ skip_sess_setup:
free_xid(xid);
ses->flags &= ~CIFS_SES_FLAGS_PENDING_QUERY_INTERFACES;

+ /* regardless of rc value, setup polling */
+ queue_delayed_work(cifsiod_wq, &tcon->query_interfaces,
+ (SMB_INTERFACE_POLL_INTERVAL * HZ));
+
mutex_unlock(&ses->session_mutex);

if (rc == -EOPNOTSUPP && ses->chan_count > 1) {
@@ -443,11 +447,8 @@ skip_sess_setup:
if (ses->chan_max > ses->chan_count &&
ses->iface_count &&
!SERVER_IS_CHAN(server)) {
- if (ses->chan_count == 1) {
+ if (ses->chan_count == 1)
cifs_server_dbg(VFS, "supports multichannel now\n");
- queue_delayed_work(cifsiod_wq, &tcon->query_interfaces,
- (SMB_INTERFACE_POLL_INTERVAL * HZ));
- }

cifs_try_adding_channels(ses);
}
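
The patch above moves the re-arm of the polling work out of the error path, so one failed query no longer stops polling permanently. A userspace sketch of the post-patch control flow follows, with stubbed, hypothetical helpers (queue_delayed and the query stub) standing in for the kernel workqueue API.

#include <stdio.h>

#define POLL_INTERVAL 600	/* stands in for SMB_INTERFACE_POLL_INTERVAL, in seconds */

static int query_server_interfaces_stub(void)
{
	return -1;		/* pretend the query failed this round */
}

static void queue_delayed(void (*fn)(void), int secs)
{
	(void)fn; (void)secs;	/* placeholder for a real delayed-work queue */
}

static void interface_poll_worker(void)
{
	int rc = query_server_interfaces_stub();

	if (rc)
		fprintf(stderr, "interface query failed: %d (will retry)\n", rc);

	/* post-patch behaviour: re-arm unconditionally; pre-patch, an
	 * -EOPNOTSUPP error returned early here and polling never resumed */
	queue_delayed(interface_poll_worker, POLL_INTERVAL);
}
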
@@ -1,148 +0,0 @@
From 17457c5d0fa0b98cef9d2236a1518b1ded25fa5d Mon Sep 17 00:00:00 2001
From: Bharath SM <bharathsm.hsk@gmail.com>
Date: Wed, 11 Jun 2025 16:59:02 +0530
Subject: smb: improve directory cache reuse for readdir operations

Currently, cached directory contents are not reused across subsequent
'ls' operations because the cache validity check relies on comparing
the ctx pointer, which changes with each readdir invocation. As a
result, the cached dir entries are never marked as valid and the cache
is not utilized for subsequent 'ls' operations.

This change uses the file pointer, which remains consistent across all
readdir calls for a given directory instance, to associate and validate
the cache. As a result, cached directory contents can now be
correctly reused, improving performance for repeated directory listings.

Performance gains with a local Windows SMB server:

Without the patch and default actimeo=1:
1000 directory enumeration operations on a dir with 10k files took 135.0s

With this patch and actimeo=0:
1000 directory enumeration operations on a dir with 10k files took just 5.1s

Signed-off-by: Bharath SM <bharathsm@microsoft.com>
Reviewed-by: Shyam Prasad N <sprasad@microsoft.com>
Cc: stable@vger.kernel.org
Signed-off-by: Steve French <stfrench@microsoft.com>
---
fs/smb/client/cached_dir.h | 8 ++++----
fs/smb/client/readdir.c | 28 +++++++++++++++-------------
2 files changed, 19 insertions(+), 17 deletions(-)

--- a/fs/smb/client/cached_dir.h
+++ b/fs/smb/client/cached_dir.h
@@ -21,10 +21,10 @@ struct cached_dirent {
struct cached_dirents {
bool is_valid:1;
bool is_failed:1;
- struct dir_context *ctx; /*
- * Only used to make sure we only take entries
- * from a single context. Never dereferenced.
- */
+ struct file *file; /*
+ * Used to associate the cache with a single
+ * open file instance.
+ */
struct mutex de_mutex;
int pos; /* Expected ctx->pos */
struct list_head entries;
--- a/fs/smb/client/readdir.c
+++ b/fs/smb/client/readdir.c
@@ -850,9 +850,9 @@ static bool emit_cached_dirents(struct c
}

static void update_cached_dirents_count(struct cached_dirents *cde,
- struct dir_context *ctx)
+ struct file *file)
{
- if (cde->ctx != ctx)
+ if (cde->file != file)
return;
if (cde->is_valid || cde->is_failed)
return;
@@ -861,9 +861,9 @@ static void update_cached_dirents_count(
}

static void finished_cached_dirents_count(struct cached_dirents *cde,
- struct dir_context *ctx)
+ struct dir_context *ctx, struct file *file)
{
- if (cde->ctx != ctx)
+ if (cde->file != file)
return;
if (cde->is_valid || cde->is_failed)
return;
@@ -876,11 +876,12 @@ static void finished_cached_dirents_coun
static void add_cached_dirent(struct cached_dirents *cde,
struct dir_context *ctx,
const char *name, int namelen,
- struct cifs_fattr *fattr)
+ struct cifs_fattr *fattr,
+ struct file *file)
{
struct cached_dirent *de;

- if (cde->ctx != ctx)
+ if (cde->file != file)
return;
if (cde->is_valid || cde->is_failed)
return;
@@ -910,7 +911,8 @@ static void add_cached_dirent(struct cac
static bool cifs_dir_emit(struct dir_context *ctx,
const char *name, int namelen,
struct cifs_fattr *fattr,
- struct cached_fid *cfid)
+ struct cached_fid *cfid,
+ struct file *file)
{
bool rc;
ino_t ino = cifs_uniqueid_to_ino_t(fattr->cf_uniqueid);
@@ -922,7 +924,7 @@ static bool cifs_dir_emit(struct dir_con
if (cfid) {
mutex_lock(&cfid->dirents.de_mutex);
add_cached_dirent(&cfid->dirents, ctx, name, namelen,
- fattr);
+ fattr, file);
mutex_unlock(&cfid->dirents.de_mutex);
}

@@ -1022,7 +1024,7 @@ static int cifs_filldir(char *find_entry
cifs_prime_dcache(file_dentry(file), &name, &fattr);

return !cifs_dir_emit(ctx, name.name, name.len,
- &fattr, cfid);
+ &fattr, cfid, file);
}


@@ -1073,8 +1075,8 @@ int cifs_readdir(struct file *file, stru
* we need to initialize scanning and storing the
* directory content.
*/
- if (ctx->pos == 0 && cfid->dirents.ctx == NULL) {
- cfid->dirents.ctx = ctx;
+ if (ctx->pos == 0 && cfid->dirents.file == NULL) {
+ cfid->dirents.file = file;
cfid->dirents.pos = 2;
}
/*
@@ -1142,7 +1144,7 @@ int cifs_readdir(struct file *file, stru
} else {
if (cfid) {
mutex_lock(&cfid->dirents.de_mutex);
- finished_cached_dirents_count(&cfid->dirents, ctx);
+ finished_cached_dirents_count(&cfid->dirents, ctx, file);
mutex_unlock(&cfid->dirents.de_mutex);
}
cifs_dbg(FYI, "Could not find entry\n");
@@ -1183,7 +1185,7 @@ int cifs_readdir(struct file *file, stru
ctx->pos++;
if (cfid) {
mutex_lock(&cfid->dirents.de_mutex);
- update_cached_dirents_count(&cfid->dirents, ctx);
+ update_cached_dirents_count(&cfid->dirents, file);
mutex_unlock(&cfid->dirents.de_mutex);
}

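The patch above changes the cache key from the per-call dir_context to the per-open struct file. A small stand-in sketch of why the old key could never match on a second readdir of the same open directory; the types here are simplified and hypothetical, not the cifs structures.

#include <stdbool.h>

struct cached_dirents {
	bool is_valid;
	const void *owner;	/* identity of the open directory (struct file) */
};

/* pre-patch, validity was keyed on the dir_context pointer; the VFS
 * builds a fresh dir_context for every readdir() call, so the check
 * failed on every call after the first and the cache was never used.
 * The open-file pointer is stable for the lifetime of the open dir. */
static bool cache_matches(const struct cached_dirents *cde, const void *file)
{
	return cde->owner == file;
}
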
@@ -1,45 +0,0 @@
From 9d330e139e9993f2489fcfe3048c8e737085646d Mon Sep 17 00:00:00 2001
From: Namjae Jeon <linkinjeon@kernel.org>
Date: Fri, 13 Jun 2025 10:12:43 +0900
Subject: ksmbd: fix null pointer dereference in destroy_previous_session

If a client sets ->PreviousSessionId during the Kerberos session setup
stage, a NULL pointer dereference will happen: since sess->user is not
set yet, the user argument passed to destroy_previous_session is NULL.
sess->user will be set in ksmbd_krb5_authenticate(), so this patch moves
the call to destroy_previous_session() after ksmbd_krb5_authenticate().

Cc: stable@vger.kernel.org
Reported-by: zdi-disclosures@trendmicro.com # ZDI-CAN-27391
Signed-off-by: Namjae Jeon <linkinjeon@kernel.org>
Signed-off-by: Steve French <stfrench@microsoft.com>
---
fs/smb/server/smb2pdu.c | 11 ++++++-----
1 file changed, 6 insertions(+), 5 deletions(-)

--- a/fs/smb/server/smb2pdu.c
+++ b/fs/smb/server/smb2pdu.c
@@ -1607,17 +1607,18 @@ static int krb5_authenticate(struct ksmb
out_len = work->response_sz -
(le16_to_cpu(rsp->SecurityBufferOffset) + 4);

- /* Check previous session */
- prev_sess_id = le64_to_cpu(req->PreviousSessionId);
- if (prev_sess_id && prev_sess_id != sess->id)
- destroy_previous_session(conn, sess->user, prev_sess_id);
-
retval = ksmbd_krb5_authenticate(sess, in_blob, in_len,
out_blob, &out_len);
if (retval) {
ksmbd_debug(SMB, "krb5 authentication failed\n");
return -EINVAL;
}
+
+ /* Check previous session */
+ prev_sess_id = le64_to_cpu(req->PreviousSessionId);
+ if (prev_sess_id && prev_sess_id != sess->id)
+ destroy_previous_session(conn, sess->user, prev_sess_id);
+
rsp->SecurityBufferLength = cpu_to_le16(out_len);

if ((conn->sign || server_conf.enforced_signing) ||
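
The patch above is purely an ordering fix: destroy_previous_session() dereferences sess->user, which is populated only by ksmbd_krb5_authenticate(). Below is a standalone sketch of the corrected call order, with hypothetical stand-in types (struct user, session_setup) rather than the ksmbd ones.

#include <stdint.h>
#include <stddef.h>

struct user { int refcount; };
struct session { uint64_t id; struct user *user; };

static int authenticate(struct session *sess)
{
	static struct user u;
	sess->user = &u;	/* mirrors ksmbd_krb5_authenticate() setting sess->user */
	return 0;
}

static void destroy_previous(struct user *u, uint64_t prev_id)
{
	(void)prev_id;
	u->refcount--;		/* dereferences u: crashes if u == NULL */
}

static int session_setup(struct session *sess, uint64_t prev_sess_id)
{
	/* pre-patch, destroy_previous() ran here, while sess->user was
	 * still NULL, so a crafted PreviousSessionId triggered the oops */
	if (authenticate(sess))
		return -1;

	/* post-patch ordering: sess->user is populated first */
	if (prev_sess_id && prev_sess_id != sess->id)
		destroy_previous(sess->user, prev_sess_id);
	return 0;
}
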
@@ -32,7 +32,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>

--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -3994,6 +3994,7 @@ static int tcp_ack(struct sock *sk, cons
@@ -4003,6 +4003,7 @@ static int tcp_ack(struct sock *sk, cons

prior_fack = tcp_is_sack(tp) ? tcp_highest_sack_seq(tp) : tp->snd_una;
rs.prior_in_flight = tcp_packets_in_flight(tp);

@@ -28,7 +28,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
struct tcp_congestion_ops {
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -4084,6 +4084,7 @@ static int tcp_ack(struct sock *sk, cons
@@ -4093,6 +4093,7 @@ static int tcp_ack(struct sock *sk, cons
delivered = tcp_newly_delivered(sk, delivered, flag);
lost = tp->lost - lost; /* freshly marked lost */
rs.is_ack_delayed = !!(flag & FLAG_ACK_MAYBE_DELAYED);

@@ -42,7 +42,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
*/
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -1139,7 +1139,12 @@ static void tcp_verify_retransmit_hint(s
@@ -1135,7 +1135,12 @@ static void tcp_verify_retransmit_hint(s
*/
static void tcp_notify_skb_loss_event(struct tcp_sock *tp, const struct sk_buff *skb)
{

@@ -39,7 +39,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>

--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -1516,6 +1516,17 @@ static bool tcp_shifted_skb(struct sock
@@ -1512,6 +1512,17 @@ static bool tcp_shifted_skb(struct sock
WARN_ON_ONCE(tcp_skb_pcount(skb) < pcount);
tcp_skb_pcount_add(skb, -pcount);


@@ -54,7 +54,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
if (tcp_ca_needs_ecn(sk))
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -5800,13 +5800,14 @@ static void __tcp_ack_snd_check(struct s
@@ -5809,13 +5809,14 @@ static void __tcp_ack_snd_check(struct s

/* More than one full frame received... */
if (((tp->rcv_nxt - tp->rcv_wup) > inet_csk(sk)->icsk_ack.rcv_mss &&

@@ -35,7 +35,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
/* Information about inbound ACK, passed to cong_ops->in_ack_event() */
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -3881,6 +3881,7 @@ static void tcp_process_tlp_ack(struct s
@@ -3890,6 +3890,7 @@ static void tcp_process_tlp_ack(struct s
/* ACK advances: there was a loss, so reduce cwnd. Reset
* tlp_high_seq in tcp_init_cwnd_reduction()
*/

@@ -31,7 +31,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
};
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -3864,7 +3864,8 @@ static int tcp_replace_ts_recent(struct
@@ -3873,7 +3873,8 @@ static int tcp_replace_ts_recent(struct
/* This routine deals with acks during a TLP episode and ends an episode by
* resetting tlp_high_seq. Ref: TLP algorithm in draft-ietf-tcpm-rack
*/
@@ -41,7 +41,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
{
struct tcp_sock *tp = tcp_sk(sk);

@@ -3892,6 +3893,11 @@ static void tcp_process_tlp_ack(struct s
@@ -3901,6 +3902,11 @@ static void tcp_process_tlp_ack(struct s
FLAG_NOT_DUP | FLAG_DATA_SACKED))) {
/* Pure dupack: original and TLP probe arrived; no loss */
tp->tlp_high_seq = 0;
@@ -53,7 +53,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
}
}

@@ -4077,7 +4083,7 @@ static int tcp_ack(struct sock *sk, cons
@@ -4086,7 +4092,7 @@ static int tcp_ack(struct sock *sk, cons
tcp_in_ack_event(sk, flag);

if (tp->tlp_high_seq)
@@ -62,7 +62,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>

if (tcp_ack_is_dubious(sk, flag)) {
if (!(flag & (FLAG_SND_UNA_ADVANCED |
@@ -4122,7 +4128,7 @@ no_queue:
@@ -4131,7 +4137,7 @@ no_queue:
tcp_ack_probe(sk);

if (tp->tlp_high_seq)

@@ -83,7 +83,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
.maxlen = sizeof(u8),
--- a/net/ipv4/tcp_input.c
+++ b/net/ipv4/tcp_input.c
@@ -5682,6 +5682,7 @@ static bool tcp_prune_ofo_queue(struct s
@@ -5691,6 +5691,7 @@ static bool tcp_prune_ofo_queue(struct s
static int tcp_prune_queue(struct sock *sk, const struct sk_buff *in_skb)
{
struct tcp_sock *tp = tcp_sk(sk);
@@ -91,7 +91,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>

NET_INC_STATS(sock_net(sk), LINUX_MIB_PRUNECALLED);

@@ -5693,6 +5694,39 @@ static int tcp_prune_queue(struct sock *
@@ -5702,6 +5703,39 @@ static int tcp_prune_queue(struct sock *
if (atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf)
return 0;

@@ -131,7 +131,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
tcp_collapse_ofo_queue(sk);
if (!skb_queue_empty(&sk->sk_receive_queue))
tcp_collapse(sk, &sk->sk_receive_queue, NULL,
@@ -5711,6 +5745,8 @@ static int tcp_prune_queue(struct sock *
@@ -5720,6 +5754,8 @@ static int tcp_prune_queue(struct sock *
if (atomic_read(&sk->sk_rmem_alloc) <= sk->sk_rcvbuf)
return 0;


@@ -180,7 +180,7 @@ Signed-off-by: Alexandre Frade <kernel@xanmod.org>
/*
* Some NVIDIA GPU devices do not work with bus reset, SBR needs to be
* prevented for those affected devices.
@@ -5171,6 +5271,8 @@ static const struct pci_dev_acs_enabled
@@ -5194,6 +5294,8 @@ static const struct pci_dev_acs_enabled
{ PCI_VENDOR_ID_ZHAOXIN, PCI_ANY_ID, pci_quirk_zhaoxin_pcie_ports_acs },
/* Wangxun nics */
{ PCI_VENDOR_ID_WANGXUN, PCI_ANY_ID, pci_quirk_wangxun_nic_acs },

@@ -94,7 +94,7 @@ Contains:
-#endif
--- a/drivers/ata/ahci.c
+++ b/drivers/ata/ahci.c
@@ -1629,7 +1629,7 @@ static irqreturn_t ahci_thunderx_irq_han
@@ -1662,7 +1662,7 @@ static irqreturn_t ahci_thunderx_irq_han
}
#endif

@@ -103,7 +103,7 @@ Contains:
struct ahci_host_priv *hpriv)
{
int i;
@@ -1642,7 +1642,7 @@ static void ahci_remap_check(struct pci_
@@ -1675,7 +1675,7 @@ static void ahci_remap_check(struct pci_
pci_resource_len(pdev, bar) < SZ_512K ||
bar != AHCI_PCI_BAR_STANDARD ||
!(readl(hpriv->mmio + AHCI_VSCAP) & 1))
@@ -112,7 +112,7 @@ Contains:

cap = readq(hpriv->mmio + AHCI_REMAP_CAP);
for (i = 0; i < AHCI_MAX_REMAP; i++) {
@@ -1657,18 +1657,11 @@ static void ahci_remap_check(struct pci_
@@ -1690,18 +1690,11 @@ static void ahci_remap_check(struct pci_
}

if (!hpriv->remapped_nvme)
@@ -135,7 +135,7 @@ Contains:
}

static int ahci_get_irq_vector(struct ata_host *host, int port)
@@ -1912,7 +1905,9 @@ static int ahci_init_one(struct pci_dev
@@ -1945,7 +1938,9 @@ static int ahci_init_one(struct pci_dev
return -ENOMEM;

/* detect remapped nvme devices */
79
debian/patches/series
vendored
@@ -129,9 +129,8 @@ misc-openwrt/0005-mac80211-minstrel_ht-reduce-fluctuations-in-rate-pro.patch
misc-openwrt/0006-mac80211-minstrel_ht-rework-rate-downgrade-code-and-.patch
misc-openwrt/0007-mac80211-increase-quantum-for-airtime-scheduler.patch
misc-openwrt/0008-mac80211-add-AQL-support-for-broadcast-packets.patch
misc-openwrt/0009-mac80211-revert-dynamically-set-codel-parameters-per-station.patch
misc-openwrt/0010-mac80211-txq-tune.patch
misc-openwrt/0011-cfg80211-aql-txq-limit.patch
misc-openwrt/0009-mac80211-txq-tune.patch
misc-openwrt/0010-cfg80211-aql-txq-limit.patch
misc-openwrt/0101-sched-sch_cake-fix-bulk-flow-accounting-logic-for-host.patch
misc-openwrt/0201-fq-adjust-memory-size.patch

@@ -140,26 +139,6 @@ patchset-pf/cpuidle/0001-cpuidle-Prefer-teo-over-menu-governor.patch
patchset-pf/kbuild/0001-ice-mark-ice_write_prof_mask_reg-as-noinline.patch
patchset-pf/kbuild/0002-wifi-mac80211-mark-copy_mesh_setup-as-noinline.patch

patchset-pf/nfs/0001-NFSD-unregister-filesystem-in-case-genl_register_fam.patch
patchset-pf/nfs/0002-NFSD-fix-race-between-nfsd-registration-and-exports_.patch
patchset-pf/nfs/0003-nfsd-fix-access-checking-for-NLM-under-XPRTSEC-polic.patch
patchset-pf/nfs/0004-nfsd-nfsd4_spo_must_allow-must-check-this-is-a-v4-co.patch
patchset-pf/nfs/0005-nfsd-Initialize-ssc-before-laundromat_work-to-preven.patch
patchset-pf/nfs/0006-NFSD-Implement-FATTR4_CLONE_BLKSIZE-attribute.patch
patchset-pf/nfs/0007-fs-nfs-read-fix-double-unlock-bug-in-nfs_return_empt.patch
patchset-pf/nfs/0008-NFSv4-Don-t-check-for-OPEN-feature-support-in-v4.1.patch
patchset-pf/nfs/0009-NFS-always-probe-for-LOCALIO-support-asynchronously.patch

patchset-pf/smb/0001-smb-client-add-NULL-check-in-automount_fullpath.patch
patchset-pf/smb/0002-cifs-reset-connections-for-all-channels-when-reconne.patch
patchset-pf/smb/0003-cifs-update-dstaddr-whenever-channel-iface-is-update.patch
patchset-pf/smb/0004-cifs-dns-resolution-is-needed-only-for-primary-chann.patch
patchset-pf/smb/0005-cifs-deal-with-the-channel-loading-lag-while-picking.patch
patchset-pf/smb/0006-cifs-serialize-other-channels-when-query-server-inte.patch
patchset-pf/smb/0007-cifs-do-not-disable-interface-polling-on-failure.patch
patchset-pf/smb/0008-smb-improve-directory-cache-reuse-for-readdir-operat.patch
patchset-pf/smb/0009-ksmbd-fix-null-pointer-dereference-in-destroy_previo.patch

patchset-xanmod/binder/0001-binder-turn-into-module.patch

patchset-xanmod/clearlinux/0001-sched-wait-Do-accept-in-LIFO-order-for-cache-efficie.patch
@@ -241,50 +220,16 @@ patchset-zen/sauce/0020-ZEN-INTERACTIVE-dm-crypt-Disable-workqueues-for-cryp.pat
patchset-zen/sauce/0021-ZEN-INTERACTIVE-mm-swap-Disable-swap-in-readahead.patch
patchset-zen/sauce/0022-ZEN-INTERACTIVE-Document-PDS-BMQ-configuration.patch

patchset-pf/fixes/0001-mm-fix-ratelimit_pages-update-error-in-dirty_ratio_h.patch
patchset-pf/fixes/0002-vgacon-Add-check-for-vc_origin-address-range-in-vgac.patch
patchset-pf/fixes/0003-fbdev-Fix-do_register_framebuffer-to-prevent-null-pt.patch
patchset-pf/fixes/0004-fbdev-Fix-fb_set_var-to-prevent-null-ptr-deref-in-fb.patch
patchset-pf/fixes/0005-anon_inode-use-a-proper-mode-internally.patch
patchset-pf/fixes/0006-anon_inode-explicitly-block-setattr.patch
patchset-pf/fixes/0007-anon_inode-raise-SB_I_NODEV-and-SB_I_NOEXEC.patch
patchset-pf/fixes/0008-fs-add-S_ANON_INODE.patch
patchset-pf/fixes/0009-configfs-Do-not-override-creating-attribute-file-fai.patch
patchset-pf/fixes/0010-Revert-Disable-FOP_DONTCACHE-for-now-due-to-bugs.patch
patchset-pf/fixes/0011-mm-filemap-unify-read-write-dropbehind-naming.patch
patchset-pf/fixes/0012-mm-filemap-unify-dropbehind-flag-testing-and-clearin.patch
patchset-pf/fixes/0013-mm-khugepaged-fix-race-with-folio-split-free-using-t.patch
patchset-pf/fixes/0014-mm-add-folio_expected_ref_count-for-reference-count-.patch
patchset-pf/fixes/0015-mm-fix-uprobe-pte-be-overwritten-when-expanding-vma.patch
patchset-pf/fixes/0016-mm-hugetlb-unshare-page-tables-during-VMA-split-not-.patch
patchset-pf/fixes/0017-mm-hugetlb-fix-huge_pmd_unshare-vs-GUP-fast-race.patch
patchset-pf/fixes/0018-mm-madvise-handle-madvise_lock-failure-during-race-u.patch
patchset-pf/fixes/0019-video-screen_info-Relocate-framebuffers-behind-PCI-b.patch
patchset-pf/fixes/0020-sysfb-Fix-screen_info-type-check-for-VGA.patch
patchset-pf/fixes/0021-watchdog-fix-watchdog-may-detect-false-positive-of-s.patch
patchset-pf/fixes/0022-sched-rt-Fix-race-in-push_rt_task.patch
patchset-pf/fixes/0023-sched-fair-Adhere-to-place_entity-constraints.patch
patchset-pf/fixes/0024-alloc_tag-handle-module-codetag-load-errors-as-modul.patch
patchset-pf/fixes/0025-svcrdma-Unregister-the-device-if-svc_rdma_accept-fai.patch
patchset-pf/fixes/0026-SUNRPC-Prevent-hang-on-NFS-mount-with-xprtsec-m-tls.patch
patchset-pf/fixes/0027-hv_netvsc-fix-potential-deadlock-in-netvsc_vf_setxdp.patch
patchset-pf/fixes/0028-net-clear-the-dst-when-changing-skb-protocol.patch
patchset-pf/fixes/0029-net_sched-sch_sfq-reject-invalid-perturb-period.patch
patchset-pf/fixes/0030-mm-vma-reset-VMA-iterator-on-commit_merge-OOM-failur.patch
patchset-pf/fixes/0031-mm-close-theoretical-race-where-stale-TLB-entries-co.patch
patchset-pf/fixes/0032-io_uring-kbuf-don-t-truncate-end-buffer-for-multiple.patch
patchset-pf/fixes/0033-nvme-always-punt-polled-uring_cmd-end_io-work-to-tas.patch
patchset-pf/fixes/0034-block-Clear-BIO_EMULATES_ZONE_APPEND-flag-on-BIO-com.patch
patchset-pf/fixes/0035-block-use-plug-request-list-tail-for-one-shot-backme.patch
patchset-pf/fixes/0036-Revert-mm-execmem-Unify-early-execmem_cache-behaviou.patch
patchset-pf/fixes/0037-x86-virt-tdx-Avoid-indirect-calls-to-TDX-assembly-fu.patch
patchset-pf/fixes/0038-x86-mm-pat-don-t-collapse-pages-without-PSE-set.patch
patchset-pf/fixes/0039-x86-Kconfig-only-enable-ROX-cache-in-execmem-when-ST.patch
patchset-pf/fixes/0040-x86-its-move-its_pages-array-to-struct-mod_arch_spec.patch
patchset-pf/fixes/0041-x86-its-explicitly-manage-permissions-for-ITS-pages.patch
patchset-pf/fixes/0042-KVM-SVM-Clear-current_vmcb-during-vCPU-free-for-all-.patch
patchset-pf/fixes/0043-KVM-VMX-Flush-shadow-VMCS-on-emergency-reboot.patch
patchset-pf/fixes/0001-Revert-Disable-FOP_DONTCACHE-for-now-due-to-bugs.patch
patchset-pf/fixes/0002-mm-filemap-unify-read-write-dropbehind-naming.patch
patchset-pf/fixes/0003-mm-filemap-unify-dropbehind-flag-testing-and-clearin.patch
patchset-pf/fixes/0004-mm-khugepaged-fix-race-with-folio-split-free-using-t.patch
patchset-pf/fixes/0005-mm-add-folio_expected_ref_count-for-reference-count-.patch
patchset-pf/fixes/0006-drm-i915-snps_hdmi_pll-Fix-64-bit-divisor-truncation.patch
patchset-pf/fixes/0007-mm-shmem-swap-fix-softlockup-with-mTHP-swapin.patch
patchset-pf/fixes/0008-mm-gup-revert-mm-gup-fix-infinite-loop-within-__get_.patch
patchset-pf/fixes/0009-mm-userfaultfd-fix-race-of-userfaultfd_move-and-swap.patch
patchset-pf/fixes/0010-dm-raid-fix-variable-in-journal-device-check.patch

patchset-zen/fixes/0001-drivers-firmware-skip-simpledrm-if-nvidia-drm.modese.patch
patchset-zen/fixes/0002-x86-cpu-Help-users-notice-when-running-old-Intel-mic.patch
patchset-zen/fixes/0003-drm-i915-snps_hdmi_pll-Fix-64-bit-divisor-truncation.patch
3
debian/rules.real
vendored
@@ -225,7 +225,7 @@ define dh_binary_post
dh_lintian
dh_icons
dh_link
dh_compress
dh_compress $(DH_COMPRESS_ARGS)
dh_fixperms
dh_missing
dh_strip $(DH_STRIP_ARGS) -Xvmlinux -Xvmlinuz
@@ -491,6 +491,7 @@ binary_perf build_perf: export _PYTHON_SYSCONFIGDATA_NAME = _sysconfigdata__$(DE
build_perf: $(STAMPS_DIR)/build-tools-headers
$(call make-tools,tools/perf)

binary_perf: DH_COMPRESS_ARGS = -Xtips.txt
binary_perf: DH_SHLIBDEPS_ARGS = -Xperf-read-vdso
binary_perf: build_perf
$(dh_binary_pre)