6.5RC5

2023-08-10 18:30:38 +01:00 · 2023-08-10 18:30:38 +01:00 · 60dc452fb5
commit 60dc452fb5
parent 9ec4cbb0e4
7 changed files with 2915 additions and 5588 deletions
--- a/11
+++ b/11
@ -594,7 +594,9 @@ CONFIG_CALL_DEPTH_TRACKING=y
 # CONFIG_CALL_THUNKS_DEBUG is not set
 CONFIG_CPU_IBPB_ENTRY=y
 CONFIG_CPU_IBRS_ENTRY=y
 CONFIG_CPU_SRSO=y
 CONFIG_SLS=y
 # CONFIG_GDS_FORCE_MITIGATION is not set
 CONFIG_ARCH_HAS_ADD_PAGES=y
 CONFIG_ARCH_MHP_MEMMAP_ON_MEMORY_ENABLE=y
@ -1333,11 +1335,10 @@ CONFIG_TCP_CONG_YEAH=m
 CONFIG_TCP_CONG_ILLINOIS=m
 CONFIG_TCP_CONG_DCTCP=m
 CONFIG_TCP_CONG_CDG=m
-CONFIG_TCP_CONG_BBR=m
+CONFIG_TCP_CONG_BBR=y
-CONFIG_TCP_CONG_BBR2=y
+CONFIG_DEFAULT_BBR=y
 CONFIG_DEFAULT_BBR2=y
 # CONFIG_DEFAULT_RENO is not set
-CONFIG_DEFAULT_TCP_CONG="bbr2"
+CONFIG_DEFAULT_TCP_CONG="bbr"
 CONFIG_TCP_MD5SIG=y
 CONFIG_IPV6=y
 CONFIG_IPV6_ROUTER_PREF=y
@ -2613,7 +2614,7 @@ CONFIG_ZRAM_DEF_COMP_ZSTD=y
 # CONFIG_ZRAM_DEF_COMP_842 is not set
 CONFIG_ZRAM_DEF_COMP="zstd"
 CONFIG_ZRAM_WRITEBACK=y
-# CONFIG_ZRAM_MEMORY_TRACKING is not set
+CONFIG_ZRAM_MEMORY_TRACKING=y
 CONFIG_ZRAM_MULTI_COMP=y
 CONFIG_BLK_DEV_LOOP=m
 CONFIG_BLK_DEV_LOOP_MIN_COUNT=0
--- a/patches/0001-cachy-all.patch
+++ b/patches/0001-cachy-all.patch
--- a/patches/0002-eevdf.patch
+++ b/patches/0002-eevdf.patch
@ -1,7 +1,7 @@
-From 0af97bb369de3bfe15d724e9bb0e3c971c6f9f20 Mon Sep 17 00:00:00 2001
+From 218c51e49185b75b4e36c8f11b5c77686f955a0a Mon Sep 17 00:00:00 2001
 From: Peter Jung <admin@ptr1337.dev>
-Date: Mon, 10 Jul 2023 17:12:45 +0200
+Date: Sun, 30 Jul 2023 09:38:51 +0200
-Subject: [PATCH] EEVDF-cachy
+Subject: [PATCH] EEVDF
 Signed-off-by: Peter Jung <admin@ptr1337.dev>
 ---
@ -13,11 +13,11 @@ Signed-off-by: Peter Jung <admin@ptr1337.dev>
 init/init_task.c                        |    3 +-
 kernel/sched/core.c                     |   65 +-
 kernel/sched/debug.c                    |   49 +-
- kernel/sched/fair.c                     | 1157 +++++++++++------------
+ kernel/sched/fair.c                     | 1138 +++++++++++------------
- kernel/sched/features.h                 |   24 +-
+ kernel/sched/features.h                 |   23 +-
- kernel/sched/sched.h                    |   22 +-
+ kernel/sched/sched.h                    |   21 +-
 tools/include/uapi/linux/sched.h        |    4 +-
- 12 files changed, 733 insertions(+), 658 deletions(-)
+ 12 files changed, 702 insertions(+), 668 deletions(-)
 diff --git a/Documentation/admin-guide/cgroup-v2.rst b/Documentation/admin-guide/cgroup-v2.rst
 index 4ef890191196..3a8d3e1e5591 100644
@ -78,7 +78,7 @@ index 7ee7ed5de722..6dbc5a1bf6a8 100644
  * Template for declaring augmented rbtree callbacks (generic case)
  *
 diff --git a/include/linux/sched.h b/include/linux/sched.h
-index efc9f4bdc4ca..e99a9aa6a972 100644
+index 609bde814cb0..c940c4dc8304 100644
 --- a/include/linux/sched.h
 +++ b/include/linux/sched.h
@@ -549,13 +549,18 @@ struct sched_entity {
@ -196,7 +196,7 @@ index ff6c4b9bfe6b..511cbcf3510d 100644
 	.rt		= {
 		.run_list	= LIST_HEAD_INIT(init_task.rt.run_list),
 diff --git a/kernel/sched/core.c b/kernel/sched/core.c
-index 83e36547af17..8a541fe2d462 100644
+index c52c2eba7c73..aff81e12460e 100644
 --- a/kernel/sched/core.c
 +++ b/kernel/sched/core.c
@@ -1305,6 +1305,12 @@ static void set_load_weight(struct task_struct *p, bool update_load)
@ -232,7 +232,7 @@ index 83e36547af17..8a541fe2d462 100644
 		/*
 		 * We don't need the reset flag anymore after the fork. It has
-@@ -7529,7 +7539,7 @@ static struct task_struct *find_process_by_pid(pid_t pid)
+@@ -7516,7 +7526,7 @@ static struct task_struct *find_process_by_pid(pid_t pid)
 #define SETPARAM_POLICY	-1
 static void __setscheduler_params(struct task_struct *p,
@ -241,7 +241,7 @@ index 83e36547af17..8a541fe2d462 100644
 {
 	int policy = attr->sched_policy;
-@@ -7553,6 +7563,13 @@ static void __setscheduler_params(struct task_struct *p,
+@@ -7540,6 +7550,13 @@ static void __setscheduler_params(struct task_struct *p,
 	set_load_weight(p, true);
 }
@ -255,7 +255,7 @@ index 83e36547af17..8a541fe2d462 100644
 /*
  * Check the target process has a UID that matches the current process's:
  */
-@@ -7687,6 +7704,13 @@ static int __sched_setscheduler(struct task_struct *p,
+@@ -7674,6 +7691,13 @@ static int __sched_setscheduler(struct task_struct *p,
 			return retval;
 	}
@ -269,7 +269,7 @@ index 83e36547af17..8a541fe2d462 100644
 	/* Update task specific "requested" clamps */
 	if (attr->sched_flags & SCHED_FLAG_UTIL_CLAMP) {
 		retval = uclamp_validate(p, attr);
-@@ -7734,6 +7758,9 @@ static int __sched_setscheduler(struct task_struct *p,
+@@ -7721,6 +7745,9 @@ static int __sched_setscheduler(struct task_struct *p,
 			goto change;
 		if (attr->sched_flags & SCHED_FLAG_UTIL_CLAMP)
 			goto change;
@ -279,7 +279,7 @@ index 83e36547af17..8a541fe2d462 100644
 		p->sched_reset_on_fork = reset_on_fork;
 		retval = 0;
-@@ -7822,6 +7849,7 @@ static int __sched_setscheduler(struct task_struct *p,
+@@ -7809,6 +7836,7 @@ static int __sched_setscheduler(struct task_struct *p,
 		__setscheduler_params(p, attr);
 		__setscheduler_prio(p, newprio);
 	}
@ -287,7 +287,7 @@ index 83e36547af17..8a541fe2d462 100644
 	__setscheduler_uclamp(p, attr);
 	if (queued) {
-@@ -8033,6 +8061,9 @@ static int sched_copy_attr(struct sched_attr __user *uattr, struct sched_attr *a
+@@ -8020,6 +8048,9 @@ static int sched_copy_attr(struct sched_attr __user *uattr, struct sched_attr *a
 	    size < SCHED_ATTR_SIZE_VER1)
 		return -EINVAL;
@ -297,7 +297,7 @@ index 83e36547af17..8a541fe2d462 100644
 	/*
 	 * XXX: Do we want to be lenient like existing syscalls; or do we want
 	 * to be strict and return an error on out-of-bounds values?
-@@ -8270,6 +8301,8 @@ SYSCALL_DEFINE4(sched_getattr, pid_t, pid, struct sched_attr __user *, uattr,
+@@ -8257,6 +8288,8 @@ SYSCALL_DEFINE4(sched_getattr, pid_t, pid, struct sched_attr __user *, uattr,
 	get_params(p, &kattr);
 	kattr.sched_flags &= SCHED_FLAG_ALL;
@ -306,7 +306,7 @@ index 83e36547af17..8a541fe2d462 100644
 #ifdef CONFIG_UCLAMP_TASK
 	/*
 	 * This could race with another potential updater, but this is fine
-@@ -11214,6 +11247,25 @@ static int cpu_idle_write_s64(struct cgroup_subsys_state *css,
+@@ -11180,6 +11213,25 @@ static int cpu_idle_write_s64(struct cgroup_subsys_state *css,
 {
 	return sched_group_set_idle(css_tg(css), idle);
 }
@ -332,7 +332,7 @@ index 83e36547af17..8a541fe2d462 100644
 #endif
 static struct cftype cpu_legacy_files[] = {
-@@ -11228,6 +11280,11 @@ static struct cftype cpu_legacy_files[] = {
+@@ -11194,6 +11246,11 @@ static struct cftype cpu_legacy_files[] = {
 		.read_s64 = cpu_idle_read_s64,
 		.write_s64 = cpu_idle_write_s64,
 	},
@ -344,7 +344,7 @@ index 83e36547af17..8a541fe2d462 100644
 #endif
 #ifdef CONFIG_CFS_BANDWIDTH
 	{
-@@ -11467,6 +11524,12 @@ static struct cftype cpu_files[] = {
+@@ -11411,6 +11468,12 @@ static struct cftype cpu_files[] = {
 		.read_s64 = cpu_idle_read_s64,
 		.write_s64 = cpu_idle_write_s64,
 	},
@ -358,7 +358,7 @@ index 83e36547af17..8a541fe2d462 100644
 #ifdef CONFIG_CFS_BANDWIDTH
 	{
 diff --git a/kernel/sched/debug.c b/kernel/sched/debug.c
-index aeeba46a096b..5c743bcb340d 100644
+index 066ff1c8ae4e..e7e83181fbb6 100644
 --- a/kernel/sched/debug.c
 +++ b/kernel/sched/debug.c
@@ -347,10 +347,7 @@ static __init int sched_init_debug(void)
@ -373,7 +373,7 @@ index aeeba46a096b..5c743bcb340d 100644
 	debugfs_create_u32("latency_warn_ms", 0644, debugfs_sched, &sysctl_resched_latency_warn_ms);
 	debugfs_create_u32("latency_warn_once", 0644, debugfs_sched, &sysctl_resched_latency_warn_once);
-@@ -582,9 +579,13 @@ print_task(struct seq_file *m, struct rq *rq, struct task_struct *p)
+@@ -581,9 +578,13 @@ print_task(struct seq_file *m, struct rq *rq, struct task_struct *p)
 	else
 		SEQ_printf(m, " %c", task_state_to_char(p));
@ -388,7 +388,7 @@ index aeeba46a096b..5c743bcb340d 100644
 		(long long)(p->nvcsw + p->nivcsw),
 		p->prio);
-@@ -627,10 +628,9 @@ static void print_rq(struct seq_file *m, struct rq *rq, int rq_cpu)
+@@ -626,10 +627,9 @@ static void print_rq(struct seq_file *m, struct rq *rq, int rq_cpu)
 void print_cfs_rq(struct seq_file *m, int cpu, struct cfs_rq *cfs_rq)
 {
@ -401,7 +401,7 @@ index aeeba46a096b..5c743bcb340d 100644
 	unsigned long flags;
 #ifdef CONFIG_FAIR_GROUP_SCHED
-@@ -644,26 +644,25 @@ void print_cfs_rq(struct seq_file *m, int cpu, struct cfs_rq *cfs_rq)
+@@ -643,26 +643,25 @@ void print_cfs_rq(struct seq_file *m, int cpu, struct cfs_rq *cfs_rq)
 			SPLIT_NS(cfs_rq->exec_clock));
 	raw_spin_rq_lock_irqsave(rq, flags);
@ -441,7 +441,7 @@ index aeeba46a096b..5c743bcb340d 100644
 	SEQ_printf(m, "  .%-30s: %d\n", "nr_spread_over",
 			cfs_rq->nr_spread_over);
 	SEQ_printf(m, "  .%-30s: %d\n", "nr_running", cfs_rq->nr_running);
-@@ -864,10 +863,7 @@ static void sched_debug_header(struct seq_file *m)
+@@ -863,10 +862,7 @@ static void sched_debug_header(struct seq_file *m)
 	SEQ_printf(m, "  .%-40s: %Ld\n", #x, (long long)(x))
 #define PN(x) \
 	SEQ_printf(m, "  .%-40s: %Ld.%06ld\n", #x, SPLIT_NS(x))
@ -453,7 +453,7 @@ index aeeba46a096b..5c743bcb340d 100644
 	P(sysctl_sched_child_runs_first);
 	P(sysctl_sched_features);
 #undef PN
-@@ -1090,6 +1086,7 @@ void proc_sched_show_task(struct task_struct *p, struct pid_namespace *ns,
+@@ -1089,6 +1085,7 @@ void proc_sched_show_task(struct task_struct *p, struct pid_namespace *ns,
 #endif
 	P(policy);
 	P(prio);
@ -462,7 +462,7 @@ index aeeba46a096b..5c743bcb340d 100644
 		P(dl.runtime);
 		P(dl.deadline);
 diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c
-index 4039ff46fcb3..0fbb8fb24a50 100644
+index 2c335df30171..461409c0eac7 100644
 --- a/kernel/sched/fair.c
 +++ b/kernel/sched/fair.c
@@ -47,6 +47,7 @@
@ -594,7 +594,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 const struct sched_class fair_sched_class;
-@@ -619,13 +569,200 @@ static inline bool entity_before(const struct sched_entity *a,
+@@ -619,13 +569,198 @@ static inline bool entity_before(const struct sched_entity *a,
 	return (s64)(a->vruntime - b->vruntime) < 0;
 }
@ -671,7 +671,6 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 +	s64 key = entity_key(cfs_rq, se);
 +
 +	cfs_rq->avg_vruntime += key * weight;
 +	cfs_rq->avg_slice += se->slice * weight;
 +	cfs_rq->avg_load += weight;
 +}
 +
@ -682,7 +681,6 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 +	s64 key = entity_key(cfs_rq, se);
 +
 +	cfs_rq->avg_vruntime -= key * weight;
 +	cfs_rq->avg_slice -= se->slice * weight;
 +	cfs_rq->avg_load -= weight;
 +}
 +
@ -796,7 +794,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	u64 vruntime = cfs_rq->min_vruntime;
-@@ -636,9 +773,7 @@ static void update_min_vruntime(struct cfs_rq *cfs_rq)
+@@ -636,9 +771,7 @@ static void update_min_vruntime(struct cfs_rq *cfs_rq)
 			curr = NULL;
 	}
@ -807,7 +805,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 		if (!curr)
 			vruntime = se->vruntime;
 		else
-@@ -647,7 +782,7 @@ static void update_min_vruntime(struct cfs_rq *cfs_rq)
+@@ -647,7 +780,7 @@ static void update_min_vruntime(struct cfs_rq *cfs_rq)
 	/* ensure we never gain time by being placed backwards. */
 	u64_u32_store(cfs_rq->min_vruntime,
@ -816,7 +814,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static inline bool __entity_less(struct rb_node *a, const struct rb_node *b)
-@@ -655,17 +790,51 @@ static inline bool __entity_less(struct rb_node *a, const struct rb_node *b)
+@@ -655,17 +788,51 @@ static inline bool __entity_less(struct rb_node *a, const struct rb_node *b)
 	return entity_before(__node_2_se(a), __node_2_se(b));
 }
@ -870,7 +868,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 struct sched_entity *__pick_first_entity(struct cfs_rq *cfs_rq)
-@@ -678,14 +847,81 @@ struct sched_entity *__pick_first_entity(struct cfs_rq *cfs_rq)
+@@ -678,14 +845,81 @@ struct sched_entity *__pick_first_entity(struct cfs_rq *cfs_rq)
 	return __node_2_se(left);
 }
@ -927,8 +925,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 +			if (best->deadline == best->min_deadline)
 +				break;
 +		}
- 
+
 -	return __node_2_se(next);
 +		/*
 +		 * If the earlest deadline in this subtree is in the fully
 +		 * eligible left half of our space, go there.
@ -941,7 +938,8 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 +
 +		node = node->rb_right;
 +	}
-+
+ 
 -	return __node_2_se(next);
 +	if (!best || (curr && deadline_gt(deadline, best, curr)))
 +		best = curr;
 +
@ -957,7 +955,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 #ifdef CONFIG_SCHED_DEBUG
-@@ -707,104 +943,53 @@ int sched_update_scaling(void)
+@@ -707,104 +941,53 @@ int sched_update_scaling(void)
 {
 	unsigned int factor = get_update_sysctl_factor();
@ -1090,7 +1088,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 #include "pelt.h"
-@@ -939,6 +1124,7 @@ static void update_curr(struct cfs_rq *cfs_rq)
+@@ -939,6 +1122,7 @@ static void update_curr(struct cfs_rq *cfs_rq)
 	schedstat_add(cfs_rq->exec_clock, delta_exec);
 	curr->vruntime += calc_delta_fair(delta_exec, curr);
@ -1098,7 +1096,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	update_min_vruntime(cfs_rq);
 	if (entity_is_task(curr)) {
-@@ -3393,16 +3579,36 @@ dequeue_load_avg(struct cfs_rq *cfs_rq, struct sched_entity *se) { }
+@@ -3393,16 +3577,36 @@ dequeue_load_avg(struct cfs_rq *cfs_rq, struct sched_entity *se) { }
 static void reweight_entity(struct cfs_rq *cfs_rq, struct sched_entity *se,
 			    unsigned long weight)
 {
@ -1135,7 +1133,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 #ifdef CONFIG_SMP
 	do {
 		u32 divider = get_pelt_divider(&se->avg);
-@@ -3412,9 +3618,11 @@ static void reweight_entity(struct cfs_rq *cfs_rq, struct sched_entity *se,
+@@ -3412,9 +3616,11 @@ static void reweight_entity(struct cfs_rq *cfs_rq, struct sched_entity *se,
 #endif
 	enqueue_load_avg(cfs_rq, se);
@ -1149,7 +1147,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 void reweight_task(struct task_struct *p, int prio)
-@@ -4710,98 +4918,140 @@ static inline void update_misfit_status(struct task_struct *p, struct rq *rq) {}
+@@ -4710,158 +4916,123 @@ static inline void update_misfit_status(struct task_struct *p, struct rq *rq) {}
 #endif /* CONFIG_SMP */
@ -1167,94 +1165,42 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 -}
 -
 -static inline bool entity_is_long_sleeper(struct sched_entity *se)
-+static inline bool
+static void
-+entity_has_slept(struct cfs_rq *cfs_rq, struct sched_entity *se, u64 vslice, int flags)
+place_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 {
 -	struct cfs_rq *cfs_rq;
 -	u64 sleep_time;
 +	u64 now, vdelta;
 +	s64 delta;
 -	if (se->exec_start == 0)
 +	if (!(flags & ENQUEUE_WAKEUP))
 		return false;
 -	cfs_rq = cfs_rq_of(se);
 -
-	sleep_time = rq_clock_task(rq_of(cfs_rq));
+-	if (se->exec_start == 0)
 +	if (flags & ENQUEUE_MIGRATED)
 +		return true;
 -	/* Happen while migrating because of clock task divergence */
 -	if (sleep_time <= se->exec_start)
 +	now = rq_clock_task(rq_of(cfs_rq));
 +	delta = now - se->exec_start;
 +	if (delta < 0)
 		return false;
 -	sleep_time -= se->exec_start;
 -	if (sleep_time > ((1ULL << 63) / scale_load_down(NICE_0_LOAD)))
 -		return true;
 +	vdelta = __calc_delta(delta, NICE_0_LOAD, &cfs_rq->load);
 +	if (vdelta < vslice)
 +		return false;
 -		return false;
-+	return true;
+-
- }
+-	cfs_rq = cfs_rq_of(se);
 static void
 -place_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int initial)
 +place_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 {
 -	u64 vruntime = cfs_rq->min_vruntime;
 +	u64 vslice = calc_delta_fair(se->slice, se);
 +	u64 vruntime = avg_vruntime(cfs_rq);
 +	s64 lag = 0;
- 	/*
+-	sleep_time = rq_clock_task(rq_of(cfs_rq));
-	 * The 'current' period is already promised to the current tasks,
+	/*
 -	 * however the extra weight of the new task will slow them down a
 -	 * little, place the new task so that it fits in the slot that
 -	 * stays open at the end.
 +	 * Due to how V is constructed as the weighted average of entities,
 +	 * adding tasks with positive lag, or removing tasks with negative lag
 +	 * will move 'time' backwards, this can screw around with the lag of
 +	 * other tasks.
 +	 *
 +	 * EEVDF: placement strategy #1 / #2
- 	 */
+	 */
 -	if (initial && sched_feat(START_DEBIT))
 -		vruntime += sched_vslice(cfs_rq, se);
 +	if (sched_feat(PLACE_LAG) && cfs_rq->nr_running) {
 +		struct sched_entity *curr = cfs_rq->curr;
 +		unsigned long load;
-	/* sleeps up to a single latency don't count. */
+-	/* Happen while migrating because of clock task divergence */
-	if (!initial) {
+-	if (sleep_time <= se->exec_start)
-		unsigned long thresh;
+-		return false;
 +		lag = se->vlag;
-		if (se_is_idle(se))
+-	sleep_time -= se->exec_start;
-			thresh = sysctl_sched_min_granularity;
+-	if (sleep_time > ((1ULL << 63) / scale_load_down(NICE_0_LOAD)))
-		else
+-		return true;
 -			thresh = sysctl_sched_latency;
 +		/*
 +		 * For latency sensitive tasks; those that have a shorter than
 +		 * average slice and do not fully consume the slice, transition
 +		 * to EEVDF placement strategy #2.
 +		 */
 +		if (sched_feat(PLACE_FUDGE) &&
 +		    (cfs_rq->avg_slice > se->slice * cfs_rq->avg_load) &&
 +		    entity_has_slept(cfs_rq, se, vslice, flags)) {
 +			lag += vslice;
 +			if (lag > 0)
 +				lag = 0;
 +		}
 		/*
 -		 * Halve their sleep time's effect, to allow
 -		 * for a gentler effect of sleepers:
 +		 * If we want to place a task and preserve lag, we have to
 +		 * consider the effect of the new entity on the weighted
 +		 * average and compensate for this, otherwise lag can quickly
@ -1305,7 +1251,52 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 +		 *                   = W*vl_i
 +		 *
 +		 *   vl_i = (W + w_i)*vl'_i / W
 +		 */
 +		load = cfs_rq->avg_load;
 +		if (curr && curr->on_rq)
 +			load += scale_load_down(curr->load.weight);
 -	return false;
 -}
 +		lag *= load + scale_load_down(se->load.weight);
 +		if (WARN_ON_ONCE(!load))
 +			load = 1;
 +		lag = div_s64(lag, load);
 +	}
 -static void
 -place_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int initial)
 -{
 -	u64 vruntime = cfs_rq->min_vruntime;
 +	se->vruntime = vruntime - lag;
 	/*
 -	 * The 'current' period is already promised to the current tasks,
 -	 * however the extra weight of the new task will slow them down a
 -	 * little, place the new task so that it fits in the slot that
 -	 * stays open at the end.
 +	 * When joining the competition; the exisiting tasks will be,
 +	 * on average, halfway through their slice, as such start tasks
 +	 * off with half a slice to ease into the competition.
 	 */
 -	if (initial && sched_feat(START_DEBIT))
 -		vruntime += sched_vslice(cfs_rq, se);
 -
 -	/* sleeps up to a single latency don't count. */
 -	if (!initial) {
 -		unsigned long thresh;
 -
 -		if (se_is_idle(se))
 -			thresh = sysctl_sched_min_granularity;
 -		else
 -			thresh = sysctl_sched_latency;
 +	if (sched_feat(PLACE_DEADLINE_INITIAL) && (flags & ENQUEUE_INITIAL))
 +		vslice /= 2;
 -		/*
 -		 * Halve their sleep time's effect, to allow
 -		 * for a gentler effect of sleepers:
 -		 */
 -		if (sched_feat(GENTLE_FAIR_SLEEPERS))
 -			thresh >>= 1;
 -
@ -1335,26 +1326,6 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 -		se->vruntime = vruntime;
 -	else
 -		se->vruntime = max_vruntime(se->vruntime, vruntime);
 +		load = cfs_rq->avg_load;
 +		if (curr && curr->on_rq)
 +			load += scale_load_down(curr->load.weight);
 +
 +		lag *= load + scale_load_down(se->load.weight);
 +		if (WARN_ON_ONCE(!load))
 +			load = 1;
 +		lag = div_s64(lag, load);
 +	}
 +
 +	se->vruntime = vruntime - lag;
 +
 +	/*
 +	 * When joining the competition; the exisiting tasks will be,
 +	 * on average, halfway through their slice, as such start tasks
 +	 * off with half a slice to ease into the competition.
 +	 */
 +	if (sched_feat(PLACE_DEADLINE_INITIAL) && (flags & ENQUEUE_INITIAL))
 +		vslice /= 2;
 +
 +	/*
 +	 * EEVDF: vd_i = ve_i + r_i/w_i
 +	 */
@ -1362,7 +1333,6 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static void check_enqueue_throttle(struct cfs_rq *cfs_rq);
@@ -4809,60 +5059,20 @@ static inline int cfs_rq_throttled(struct cfs_rq *cfs_rq);
 static inline bool cfs_bandwidth_used(void);
@ -1425,7 +1395,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	/*
 	 * When enqueuing a sched_entity, we must:
 	 *   - Update loads to have both entity and cfs_rq synced with now.
-@@ -4874,18 +5084,28 @@ enqueue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
+@@ -4873,18 +5044,28 @@ enqueue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 	 */
 	update_load_avg(cfs_rq, se, UPDATE_TG | DO_ATTACH);
 	se_update_runnable(se);
@ -1457,7 +1427,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	if (!curr)
 		__enqueue_entity(cfs_rq, se);
 	se->on_rq = 1;
-@@ -4907,17 +5127,6 @@ enqueue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
+@@ -4896,17 +5077,6 @@ enqueue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 	}
 }
@ -1475,7 +1445,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 static void __clear_buddies_next(struct sched_entity *se)
 {
 	for_each_sched_entity(se) {
-@@ -4929,27 +5138,10 @@ static void __clear_buddies_next(struct sched_entity *se)
+@@ -4918,27 +5088,10 @@ static void __clear_buddies_next(struct sched_entity *se)
 	}
 }
@ -1503,7 +1473,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static __always_inline void return_cfs_rq_runtime(struct cfs_rq *cfs_rq);
-@@ -4983,20 +5175,12 @@ dequeue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
+@@ -4972,20 +5125,12 @@ dequeue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 	clear_buddies(cfs_rq, se);
@ -1525,7 +1495,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	/* return excess runtime on last dequeue */
 	return_cfs_rq_runtime(cfs_rq);
-@@ -5015,52 +5199,6 @@ dequeue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
+@@ -5004,52 +5149,6 @@ dequeue_entity(struct cfs_rq *cfs_rq, struct sched_entity *se, int flags)
 		update_idle_cfs_rq_clock_pelt(cfs_rq);
 }
@ -1578,7 +1548,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 static void
 set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
 {
-@@ -5099,9 +5237,6 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
+@@ -5088,9 +5187,6 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
 	se->prev_sum_exec_runtime = se->sum_exec_runtime;
 }
@ -1588,7 +1558,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 /*
  * Pick the next process, keeping these things in mind, in this order:
  * 1) keep things fair between processes/task groups
-@@ -5112,50 +5247,14 @@ wakeup_preempt_entity(struct sched_entity *curr, struct sched_entity *se);
+@@ -5101,50 +5197,14 @@ wakeup_preempt_entity(struct sched_entity *curr, struct sched_entity *se);
 static struct sched_entity *
 pick_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *curr)
 {
@ -1644,7 +1614,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static bool check_cfs_rq_runtime(struct cfs_rq *cfs_rq);
-@@ -5172,8 +5271,6 @@ static void put_prev_entity(struct cfs_rq *cfs_rq, struct sched_entity *prev)
+@@ -5161,8 +5221,6 @@ static void put_prev_entity(struct cfs_rq *cfs_rq, struct sched_entity *prev)
 	/* throttle cfs_rqs exceeding runtime */
 	check_cfs_rq_runtime(cfs_rq);
@ -1653,7 +1623,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	if (prev->on_rq) {
 		update_stats_wait_start_fair(cfs_rq, prev);
 		/* Put 'current' back into the tree. */
-@@ -5214,9 +5311,6 @@ entity_tick(struct cfs_rq *cfs_rq, struct sched_entity *curr, int queued)
+@@ -5203,9 +5261,6 @@ entity_tick(struct cfs_rq *cfs_rq, struct sched_entity *curr, int queued)
 			hrtimer_active(&rq_of(cfs_rq)->hrtick_timer))
 		return;
 #endif
@ -1663,7 +1633,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
-@@ -6259,13 +6353,12 @@ static inline void unthrottle_offline_cfs_rqs(struct rq *rq) {}
+@@ -6228,13 +6283,12 @@ static inline void unthrottle_offline_cfs_rqs(struct rq *rq) {}
 static void hrtick_start_fair(struct rq *rq, struct task_struct *p)
 {
 	struct sched_entity *se = &p->se;
@ -1678,7 +1648,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 		s64 delta = slice - ran;
 		if (delta < 0) {
-@@ -6289,8 +6382,7 @@ static void hrtick_update(struct rq *rq)
+@@ -6258,8 +6312,7 @@ static void hrtick_update(struct rq *rq)
 	if (!hrtick_enabled_fair(rq) || curr->sched_class != &fair_sched_class)
 		return;
@ -1688,7 +1658,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 #else /* !CONFIG_SCHED_HRTICK */
 static inline void
-@@ -6331,17 +6423,6 @@ static int sched_idle_rq(struct rq *rq)
+@@ -6300,17 +6353,6 @@ static int sched_idle_rq(struct rq *rq)
 			rq->nr_running);
 }
@ -1706,7 +1676,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 #ifdef CONFIG_SMP
 static int sched_idle_cpu(int cpu)
 {
-@@ -7844,18 +7925,6 @@ static void migrate_task_rq_fair(struct task_struct *p, int new_cpu)
+@@ -7816,18 +7858,6 @@ static void migrate_task_rq_fair(struct task_struct *p, int new_cpu)
 {
 	struct sched_entity *se = &p->se;
@ -1725,7 +1695,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	if (!task_on_rq_migrating(p)) {
 		remove_entity_load_avg(se);
-@@ -7893,66 +7962,6 @@ balance_fair(struct rq *rq, struct task_struct *prev, struct rq_flags *rf)
+@@ -7865,66 +7895,6 @@ balance_fair(struct rq *rq, struct task_struct *prev, struct rq_flags *rf)
 }
 #endif /* CONFIG_SMP */
@ -1792,7 +1762,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 static void set_next_buddy(struct sched_entity *se)
 {
 	for_each_sched_entity(se) {
-@@ -7964,12 +7973,6 @@ static void set_next_buddy(struct sched_entity *se)
+@@ -7936,12 +7906,6 @@ static void set_next_buddy(struct sched_entity *se)
 	}
 }
@ -1805,7 +1775,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 /*
  * Preempt the current task with a newly woken task if needed:
  */
-@@ -7978,7 +7981,6 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
+@@ -7950,7 +7914,6 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
 	struct task_struct *curr = rq->curr;
 	struct sched_entity *se = &curr->se, *pse = &p->se;
 	struct cfs_rq *cfs_rq = task_cfs_rq(curr);
@ -1813,7 +1783,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	int next_buddy_marked = 0;
 	int cse_is_idle, pse_is_idle;
-@@ -7994,7 +7996,7 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
+@@ -7966,7 +7929,7 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
 	if (unlikely(throttled_hierarchy(cfs_rq_of(pse))))
 		return;
@ -1822,7 +1792,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 		set_next_buddy(pse);
 		next_buddy_marked = 1;
 	}
-@@ -8039,35 +8041,19 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
+@@ -8011,35 +7974,19 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
 	if (cse_is_idle != pse_is_idle)
 		return;
@ -1865,7 +1835,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 #ifdef CONFIG_SMP
-@@ -8268,8 +8254,6 @@ static void put_prev_task_fair(struct rq *rq, struct task_struct *prev)
+@@ -8240,8 +8187,6 @@ static void put_prev_task_fair(struct rq *rq, struct task_struct *prev)
 /*
  * sched_yield() is very simple
@ -1874,7 +1844,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
  */
 static void yield_task_fair(struct rq *rq)
 {
-@@ -8285,21 +8269,19 @@ static void yield_task_fair(struct rq *rq)
+@@ -8257,21 +8202,19 @@ static void yield_task_fair(struct rq *rq)
 	clear_buddies(cfs_rq, se);
@ -1908,7 +1878,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static bool yield_to_task_fair(struct rq *rq, struct task_struct *p)
-@@ -8547,8 +8529,7 @@ static int task_hot(struct task_struct *p, struct lb_env *env)
+@@ -8514,8 +8457,7 @@ static int task_hot(struct task_struct *p, struct lb_env *env)
 	 * Buddy candidates are cache hot:
 	 */
 	if (sched_feat(CACHE_HOT_BUDDY) && env->dst_rq->nr_running &&
@ -1918,7 +1888,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 		return 1;
 	if (sysctl_sched_migration_cost == -1)
-@@ -12174,8 +12155,8 @@ static void rq_offline_fair(struct rq *rq)
+@@ -12025,8 +11967,8 @@ static void rq_offline_fair(struct rq *rq)
 static inline bool
 __entity_slice_used(struct sched_entity *se, int min_nr_tasks)
 {
@ -1928,7 +1898,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	return (rtime * min_nr_tasks > slice);
 }
-@@ -12331,8 +12312,8 @@ static void task_tick_fair(struct rq *rq, struct task_struct *curr, int queued)
+@@ -12182,8 +12124,8 @@ static void task_tick_fair(struct rq *rq, struct task_struct *curr, int queued)
  */
 static void task_fork_fair(struct task_struct *p)
 {
@ -1938,7 +1908,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	struct rq *rq = this_rq();
 	struct rq_flags rf;
-@@ -12341,22 +12322,9 @@ static void task_fork_fair(struct task_struct *p)
+@@ -12192,22 +12134,9 @@ static void task_fork_fair(struct task_struct *p)
 	cfs_rq = task_cfs_rq(current);
 	curr = cfs_rq->curr;
@ -1963,7 +1933,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	rq_unlock(rq, &rf);
 }
-@@ -12385,34 +12353,6 @@ prio_changed_fair(struct rq *rq, struct task_struct *p, int oldprio)
+@@ -12236,34 +12165,6 @@ prio_changed_fair(struct rq *rq, struct task_struct *p, int oldprio)
 		check_preempt_curr(rq, p, 0);
 }
@ -1998,7 +1968,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 #ifdef CONFIG_FAIR_GROUP_SCHED
 /*
  * Propagate the changes of the sched_entity across the tg tree to make it
-@@ -12483,16 +12423,6 @@ static void attach_entity_cfs_rq(struct sched_entity *se)
+@@ -12334,16 +12235,6 @@ static void attach_entity_cfs_rq(struct sched_entity *se)
 static void detach_task_cfs_rq(struct task_struct *p)
 {
 	struct sched_entity *se = &p->se;
@ -2015,7 +1985,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	detach_entity_cfs_rq(se);
 }
-@@ -12500,12 +12430,8 @@ static void detach_task_cfs_rq(struct task_struct *p)
+@@ -12351,12 +12242,8 @@ static void detach_task_cfs_rq(struct task_struct *p)
 static void attach_task_cfs_rq(struct task_struct *p)
 {
 	struct sched_entity *se = &p->se;
@ -2028,7 +1998,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 }
 static void switched_from_fair(struct rq *rq, struct task_struct *p)
-@@ -12616,6 +12542,7 @@ int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent)
+@@ -12467,6 +12354,7 @@ int alloc_fair_sched_group(struct task_group *tg, struct task_group *parent)
 		goto err;
 	tg->shares = NICE_0_LOAD;
@ -2036,7 +2006,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	init_cfs_bandwidth(tg_cfs_bandwidth(tg));
-@@ -12714,6 +12641,9 @@ void init_tg_cfs_entry(struct task_group *tg, struct cfs_rq *cfs_rq,
+@@ -12565,6 +12453,9 @@ void init_tg_cfs_entry(struct task_group *tg, struct cfs_rq *cfs_rq,
 	}
 	se->my_q = cfs_rq;
@ -2046,7 +2016,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	/* guarantee group entities always have weight */
 	update_load_set(&se->load, NICE_0_LOAD);
 	se->parent = parent;
-@@ -12844,6 +12774,29 @@ int sched_group_set_idle(struct task_group *tg, long idle)
+@@ -12695,6 +12586,29 @@ int sched_group_set_idle(struct task_group *tg, long idle)
 	return 0;
 }
@ -2076,7 +2046,7 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 #else /* CONFIG_FAIR_GROUP_SCHED */
 void free_fair_sched_group(struct task_group *tg) { }
-@@ -12870,7 +12823,7 @@ static unsigned int get_rr_interval_fair(struct rq *rq, struct task_struct *task
+@@ -12721,7 +12635,7 @@ static unsigned int get_rr_interval_fair(struct rq *rq, struct task_struct *task
 	 * idle runqueue:
 	 */
 	if (rq->cfs.load.weight)
@ -2086,10 +2056,10 @@ index 4039ff46fcb3..0fbb8fb24a50 100644
 	return rr_interval;
 }
 diff --git a/kernel/sched/features.h b/kernel/sched/features.h
-index ee7f23c76bd3..7d65b40299d9 100644
+index ee7f23c76bd3..54334ca5c5c6 100644
 --- a/kernel/sched/features.h
 +++ b/kernel/sched/features.h
-@@ -1,16 +1,12 @@
+@@ -1,16 +1,11 @@
 /* SPDX-License-Identifier: GPL-2.0 */
 -/*
 - * Only give sleepers 50% of their service deficit. This allows
@ -2106,12 +2076,11 @@ index ee7f23c76bd3..7d65b40299d9 100644
  */
 -SCHED_FEAT(START_DEBIT, true)
 +SCHED_FEAT(PLACE_LAG, true)
 +SCHED_FEAT(PLACE_FUDGE, true)
 +SCHED_FEAT(PLACE_DEADLINE_INITIAL, true)
 /*
  * Prefer to schedule the task we woke last (assuming it failed
-@@ -19,13 +15,6 @@ SCHED_FEAT(START_DEBIT, true)
+@@ -19,13 +14,6 @@ SCHED_FEAT(START_DEBIT, true)
  */
 SCHED_FEAT(NEXT_BUDDY, false)
@ -2125,7 +2094,7 @@ index ee7f23c76bd3..7d65b40299d9 100644
 /*
  * Consider buddies to be cache hot, decreases the likeliness of a
  * cache buddy being migrated away, increases cache locality.
-@@ -98,6 +87,3 @@ SCHED_FEAT(UTIL_EST, true)
+@@ -98,6 +86,3 @@ SCHED_FEAT(UTIL_EST, true)
 SCHED_FEAT(UTIL_EST_FASTUP, true)
 SCHED_FEAT(LATENCY_WARN, false)
@ -2133,7 +2102,7 @@ index ee7f23c76bd3..7d65b40299d9 100644
 -SCHED_FEAT(ALT_PERIOD, true)
 -SCHED_FEAT(BASE_SLICE, true)
 diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h
-index 9baeb1a2dfdd..4236c4c893aa 100644
+index e93e006a942b..67cd7e1fd501 100644
 --- a/kernel/sched/sched.h
 +++ b/kernel/sched/sched.h
@@ -372,6 +372,8 @@ struct task_group {
@ -2154,18 +2123,17 @@ index 9baeb1a2dfdd..4236c4c893aa 100644
 #ifdef CONFIG_SMP
 extern void set_task_rq_fair(struct sched_entity *se,
 			     struct cfs_rq *prev, struct cfs_rq *next);
-@@ -548,6 +552,10 @@ struct cfs_rq {
+@@ -548,6 +552,9 @@ struct cfs_rq {
 	unsigned int		idle_nr_running;   /* SCHED_IDLE */
 	unsigned int		idle_h_nr_running; /* SCHED_IDLE */
 +	s64			avg_vruntime;
 +	u64			avg_slice;
 +	u64			avg_load;
 +
 	u64			exec_clock;
 	u64			min_vruntime;
 #ifdef CONFIG_SCHED_CORE
-@@ -567,8 +575,6 @@ struct cfs_rq {
+@@ -567,8 +574,6 @@ struct cfs_rq {
 	 */
 	struct sched_entity	*curr;
 	struct sched_entity	*next;
@ -2174,7 +2142,7 @@ index 9baeb1a2dfdd..4236c4c893aa 100644
 #ifdef	CONFIG_SCHED_DEBUG
 	unsigned int		nr_spread_over;
-@@ -2198,6 +2204,7 @@ extern const u32		sched_prio_to_wmult[40];
+@@ -2195,6 +2200,7 @@ extern const u32		sched_prio_to_wmult[40];
 #else
 #define ENQUEUE_MIGRATED	0x00
 #endif
@ -2182,7 +2150,7 @@ index 9baeb1a2dfdd..4236c4c893aa 100644
 #define RETRY_TASK		((void *)-1UL)
-@@ -2502,11 +2509,9 @@ extern void check_preempt_curr(struct rq *rq, struct task_struct *p, int flags);
+@@ -2499,11 +2505,9 @@ extern void check_preempt_curr(struct rq *rq, struct task_struct *p, int flags);
 extern const_debug unsigned int sysctl_sched_nr_migrate;
 extern const_debug unsigned int sysctl_sched_migration_cost;
@ -2196,7 +2164,7 @@ index 9baeb1a2dfdd..4236c4c893aa 100644
 extern int sysctl_resched_latency_warn_ms;
 extern int sysctl_resched_latency_warn_once;
-@@ -2519,6 +2524,8 @@ extern unsigned int sysctl_numa_balancing_scan_size;
+@@ -2516,6 +2520,8 @@ extern unsigned int sysctl_numa_balancing_scan_size;
 extern unsigned int sysctl_numa_balancing_hot_threshold;
 #endif
@ -2205,7 +2173,7 @@ index 9baeb1a2dfdd..4236c4c893aa 100644
 #ifdef CONFIG_SCHED_HRTICK
 /*
-@@ -3483,4 +3490,7 @@ static inline void task_tick_mm_cid(struct rq *rq, struct task_struct *curr) { }
+@@ -3480,4 +3486,7 @@ static inline void task_tick_mm_cid(struct rq *rq, struct task_struct *curr) { }
 static inline void init_sched_mm_cid(struct task_struct *t) { }
 #endif
--- a/patches/0002-eevdfbore.patch
+++ b/patches/0002-eevdfbore.patch
@ -1,49 +1,76 @@
-From e6e251fb3f3927c18ac4f2a22a43c6c198133d19 Mon Sep 17 00:00:00 2001
+From 377657f92d256b364813e3f8b2a58edfc9833815 Mon Sep 17 00:00:00 2001
-From: Piotr Gorski <lucjan.lucjanov@gmail.com>
+From: Peter Jung <admin@ptr1337.dev>
-Date: Sun, 23 Jul 2023 09:46:42 +0200
+Date: Sun, 30 Jul 2023 09:43:51 +0200
 Subject: [PATCH] bore-eevdf
-Signed-off-by: Piotr Gorski <lucjan.lucjanov@gmail.com>
+Signed-off-by: Peter Jung <admin@ptr1337.dev>
 ---
- include/linux/sched.h   |  10 ++
+ include/linux/sched.h   |  30 ++++++
 init/Kconfig            |  20 ++++
- kernel/sched/core.c     | 117 +++++++++++++++++++++++
+ kernel/sched/core.c     | 118 +++++++++++++++++++++
 kernel/sched/debug.c    |   4 +
- kernel/sched/fair.c     | 203 ++++++++++++++++++++++++++++++++++++++--
+ kernel/sched/fair.c     | 228 ++++++++++++++++++++++++++++++++++++++--
 kernel/sched/features.h |   4 +
 kernel/sched/sched.h    |   1 +
- 7 files changed, 351 insertions(+), 8 deletions(-)
+ 7 files changed, 397 insertions(+), 8 deletions(-)
 diff --git a/include/linux/sched.h b/include/linux/sched.h
-index e99a9aa6a..14a1ce058 100644
+index c940c4dc8304..8663c0813f81 100644
 --- a/include/linux/sched.h
 +++ b/include/linux/sched.h
-@@ -559,6 +559,12 @@ struct sched_entity {
+@@ -545,6 +545,26 @@ struct sched_statistics {
 #endif /* CONFIG_SCHEDSTATS */
 } ____cacheline_aligned;
 +#ifdef CONFIG_SCHED_BORE
 +union union16 {
 +	u16	u16;
 +	s16	s16;
 +	u8	u8[2];
 +	s8	s8[2];
 +};
 +typedef union union16 x16;
 +
 +union union32 {
 +	u32	u32;
 +	s32	s32;
 +	u16	u16[2];
 +	s16	s16[2];
 +	u8	u8[4];
 +	s8	s8[4];
 +};
 +typedef union union32 x32;
 +#endif // CONFIG_SCHED_BORE
 +
 struct sched_entity {
 	/* For load-balancing: */
 	struct load_weight		load;
@@ -559,6 +579,12 @@ struct sched_entity {
 	u64				sum_exec_runtime;
 	u64				prev_sum_exec_runtime;
 	u64				vruntime;
 +#ifdef CONFIG_SCHED_BORE
 +	u64				prev_burst_time;
 +	u64				burst_time;
-+	u64				max_burst_time;
+	u16				prev_burst_penalty;
-+	u8				penalty_score;
+	u16				curr_burst_penalty;
 +	u16				burst_penalty;
 +#endif // CONFIG_SCHED_BORE
 	s64				vlag;
 	u64				slice;
-@@ -990,6 +996,10 @@ struct task_struct {
+@@ -990,6 +1016,10 @@ struct task_struct {
 	struct list_head		children;
 	struct list_head		sibling;
 	struct task_struct		*group_leader;
 +#ifdef CONFIG_SCHED_BORE
-+	u64	child_burst_cache;
+	u16	child_burst_cache;
 +	u64	child_burst_last_cached;
 +#endif // CONFIG_SCHED_BORE
 	/*
 	 * 'ptraced' is the list of tasks this task is using ptrace() on.
 diff --git a/init/Kconfig b/init/Kconfig
-index 71755cc8e..c697be79e 100644
+index 71755cc8ed3e..c697be79e594 100644
 --- a/init/Kconfig
 +++ b/init/Kconfig
@@ -1277,6 +1277,26 @@ config CHECKPOINT_RESTORE
@ -74,30 +101,31 @@ index 71755cc8e..c697be79e 100644
 	bool "Automatic process group scheduling"
 	select CGROUPS
 diff --git a/kernel/sched/core.c b/kernel/sched/core.c
-index 8a541fe2d..13969a3a3 100644
+index aff81e12460e..839605620f63 100644
 --- a/kernel/sched/core.c
 +++ b/kernel/sched/core.c
-@@ -4491,6 +4491,112 @@ int wake_up_state(struct task_struct *p, unsigned int state)
+@@ -4491,6 +4491,113 @@ int wake_up_state(struct task_struct *p, unsigned int state)
 	return try_to_wake_up(p, state, 0);
 }
 +#ifdef CONFIG_SCHED_BORE
 +#define CHILD_BURST_CUTOFF_BITS 9
 +extern unsigned int sched_burst_cache_lifetime;
 +extern unsigned int sched_burst_fork_atavistic;
 +
 +void __init sched_init_bore(void) {
 +	init_task.child_burst_cache = 0;
 +	init_task.child_burst_last_cached = 0;
 +	init_task.se.prev_burst_time = 0;
 +	init_task.se.burst_time = 0;
-+	init_task.se.max_burst_time = 0;
+	init_task.se.prev_burst_penalty = 0;
 +	init_task.se.curr_burst_penalty = 0;
 +	init_task.se.burst_penalty = 0;
 +}
 +
 +void inline sched_fork_bore(struct task_struct *p) {
 +	p->child_burst_cache = 0;
 +	p->child_burst_last_cached = 0;
 +	p->se.burst_time = 0;
 +	p->se.curr_burst_penalty = 0;
 +}
 +
 +static u32 count_child_tasks(struct task_struct *p) {
@ -112,31 +140,31 @@ index 8a541fe2d..13969a3a3 100644
 +}
 +
 +static void __update_child_burst_cache(
-+	struct task_struct *p, u32 cnt, u64 sum, u64 now) {
+	struct task_struct *p, u32 cnt, u32 sum, u64 now) {
-+	u64 avg = 0;
+	u16 avg = 0;
-+	if (cnt) avg = div_u64(sum, cnt) << CHILD_BURST_CUTOFF_BITS;
+	if (cnt) avg = DIV_ROUND_CLOSEST(sum, cnt);
-+	p->child_burst_cache = max(avg, p->se.max_burst_time);
+	p->child_burst_cache = max(avg, p->se.burst_penalty);
 +	p->child_burst_last_cached = now;
 +}
 +
 +static void update_child_burst_cache(struct task_struct *p, u64 now) {
 +	struct task_struct *child;
 +	u32 cnt = 0;
-+	u64 sum = 0;
+	u32 sum = 0;
 +
 +	list_for_each_entry(child, &p->children, sibling) {
 +		cnt++;
-+		sum += child->se.max_burst_time >> CHILD_BURST_CUTOFF_BITS;
+		sum += child->se.burst_penalty;
 +	}
 +
 +	__update_child_burst_cache(p, cnt, sum, now);
 +}
 +
 +static void update_child_burst_cache_atavistic(
-+	struct task_struct *p, u64 now, u32 depth, u32 *acnt, u64 *asum) {
+	struct task_struct *p, u64 now, u32 depth, u32 *acnt, u32 *asum) {
 +	struct task_struct *child, *dec;
 +	u32 cnt = 0, dcnt = 0;
-+	u64 sum = 0;
+	u32 sum = 0;
 +
 +	list_for_each_entry(child, &p->children, sibling) {
 +		dec = child;
@ -145,13 +173,13 @@ index 8a541fe2d..13969a3a3 100644
 +		
 +		if (!dcnt || !depth) {
 +			cnt++;
-+			sum += dec->se.max_burst_time >> CHILD_BURST_CUTOFF_BITS;
+			sum += dec->se.burst_penalty;
 +		} else {
 +			if (child_burst_cache_expired(dec, now))
 +				update_child_burst_cache_atavistic(dec, now, depth - 1, &cnt, &sum);
 +			else {
 +				cnt += dcnt;
-+				sum += (dec->child_burst_cache >> CHILD_BURST_CUTOFF_BITS) * dcnt;
+				sum += (dec->child_burst_cache) * dcnt;
 +			}
 +		}
 +	}
@ -161,12 +189,12 @@ index 8a541fe2d..13969a3a3 100644
 +	*asum += sum;
 +}
 +
-+static void update_task_initial_burst_time(struct task_struct *p) {
+static void fork_burst_penalty(struct task_struct *p) {
 +	struct sched_entity *se = &p->se;
 +	struct task_struct *anc = p->real_parent;
 +	u64 now = ktime_get_ns();
 +	u32 cnt = 0;
-+	u64 sum = 0;
+	u32 sum = 0;
 +
 +	read_lock(&tasklist_lock);
 +	
@ -182,15 +210,15 @@ index 8a541fe2d..13969a3a3 100644
 +
 +	read_unlock(&tasklist_lock);
 +
-+	se->max_burst_time = se->prev_burst_time =
+	se->burst_penalty = se->prev_burst_penalty =
-+		max(se->prev_burst_time, anc->child_burst_cache);
+		max(se->prev_burst_penalty, anc->child_burst_cache);
 +}
 +#endif // CONFIG_SCHED_BORE
 +
 /*
  * Perform scheduler related setup for a newly forked process p.
  * p is forked by current.
-@@ -4507,6 +4613,9 @@ static void __sched_fork(unsigned long clone_flags, struct task_struct *p)
+@@ -4507,6 +4614,9 @@ static void __sched_fork(unsigned long clone_flags, struct task_struct *p)
 	p->se.prev_sum_exec_runtime	= 0;
 	p->se.nr_migrations		= 0;
 	p->se.vruntime			= 0;
@ -200,30 +228,30 @@ index 8a541fe2d..13969a3a3 100644
 	p->se.vlag			= 0;
 	INIT_LIST_HEAD(&p->se.group_node);
-@@ -4828,6 +4937,9 @@ void sched_cgroup_fork(struct task_struct *p, struct kernel_clone_args *kargs)
+@@ -4828,6 +4938,9 @@ void sched_cgroup_fork(struct task_struct *p, struct kernel_clone_args *kargs)
 void sched_post_fork(struct task_struct *p)
 {
 +#ifdef CONFIG_SCHED_BORE
-+	update_task_initial_burst_time(p);
+	fork_burst_penalty(p);
 +#endif // CONFIG_SCHED_BORE
 	uclamp_post_fork(p);
 }
-@@ -9967,6 +10079,11 @@ void __init sched_init(void)
+@@ -9954,6 +10067,11 @@ void __init sched_init(void)
 	BUG_ON(&dl_sched_class != &stop_sched_class + 1);
 #endif
 +#ifdef CONFIG_SCHED_BORE
 +	sched_init_bore();
-+	printk(KERN_INFO "BORE (Burst-Oriented Response Enhancer) CPU Scheduler modification 2.5.3 by Masahito Suzuki");
+	printk(KERN_INFO "BORE (Burst-Oriented Response Enhancer) CPU Scheduler modification 3.0 Beta2 by Masahito Suzuki");
 +#endif // CONFIG_SCHED_BORE
 +
 	wait_bit_init();
 #ifdef CONFIG_FAIR_GROUP_SCHED
 diff --git a/kernel/sched/debug.c b/kernel/sched/debug.c
-index 5c743bcb3..755ef4c8d 100644
+index e7e83181fbb6..ff41a524c1ee 100644
 --- a/kernel/sched/debug.c
 +++ b/kernel/sched/debug.c
@@ -348,6 +348,7 @@ static __init int sched_init_debug(void)
@ -234,18 +262,18 @@ index 5c743bcb3..755ef4c8d 100644
 	debugfs_create_u32("latency_warn_ms", 0644, debugfs_sched, &sysctl_resched_latency_warn_ms);
 	debugfs_create_u32("latency_warn_once", 0644, debugfs_sched, &sysctl_resched_latency_warn_once);
-@@ -595,6 +596,9 @@ print_task(struct seq_file *m, struct rq *rq, struct task_struct *p)
+@@ -594,6 +595,9 @@ print_task(struct seq_file *m, struct rq *rq, struct task_struct *p)
 		SPLIT_NS(schedstat_val_or_zero(p->stats.sum_sleep_runtime)),
 		SPLIT_NS(schedstat_val_or_zero(p->stats.sum_block_runtime)));
 +#ifdef CONFIG_SCHED_BORE
-+	SEQ_printf(m, " %2d", p->se.penalty_score);
+	SEQ_printf(m, " %2d", ((x16*)&p->se.burst_penalty)->u8[1]);
 +#endif
 #ifdef CONFIG_NUMA_BALANCING
 	SEQ_printf(m, " %d %d", task_node(p), task_numa_group_id(p));
 #endif
 diff --git a/kernel/sched/fair.c b/kernel/sched/fair.c
-index d6042543c..e52c14232 100644
+index 461409c0eac7..90ce27fb0a3f 100644
 --- a/kernel/sched/fair.c
 +++ b/kernel/sched/fair.c
@@ -19,6 +19,9 @@
@ -281,7 +309,7 @@ index d6042543c..e52c14232 100644
 /*
  * After fork, child runs first. If set to 0 (default) then
-@@ -84,8 +87,76 @@ static unsigned int normalized_sysctl_sched_base_slice	= 750000ULL;
+@@ -84,8 +87,93 @@ static unsigned int normalized_sysctl_sched_base_slice	= 750000ULL;
  */
 unsigned int sysctl_sched_child_runs_first __read_mostly;
@ -292,55 +320,72 @@ index d6042543c..e52c14232 100644
 + * and reduces their over-scheduling. Synchronous workloads will still
 + * have immediate wakeup/sleep latencies.
 + *
-+ * (default: 3.2 msec * 1, units: nanoseconds)
+ * (default: 1.6 msec * 1, units: nanoseconds)
 + */
-+unsigned int sysctl_sched_wakeup_granularity			= 3200000UL;
+unsigned int sysctl_sched_wakeup_granularity			= 1600000UL;
-+static unsigned int normalized_sysctl_sched_wakeup_granularity	= 3200000UL;
+static unsigned int normalized_sysctl_sched_wakeup_granularity	= 1600000UL;
 +
 const_debug unsigned int sysctl_sched_migration_cost	= 500000UL;
 +#ifdef CONFIG_SCHED_BORE
 +unsigned int __read_mostly sched_bore                  = 1;
 +unsigned int __read_mostly sched_burst_cache_lifetime  = 60000000;
-+unsigned int __read_mostly sched_burst_penalty_offset = 12;
+unsigned int __read_mostly sched_burst_penalty_offset  = 18;
 +unsigned int __read_mostly sched_burst_penalty_scale   = 1292;
-+unsigned int __read_mostly sched_burst_smoothness     = 2;
+unsigned int __read_mostly sched_burst_smoothness_up   = 1;
 +unsigned int __read_mostly sched_burst_smoothness_down = 0;
 +unsigned int __read_mostly sched_burst_fork_atavistic  = 2;
 +static int three          = 3;
 +static int sixty_four     = 64;
 +static int maxval_12_bits = 4095;
 +
-+#define FIXED_SHIFT 10
+#define MAX_BURST_PENALTY ((u32)(40UL << 8) - 1)
 +#define FIXED_ONE (1 << FIXED_SHIFT)
 +typedef u32 fixed;
 +
-+static void update_burst_score(struct sched_entity *se) {
+static inline u32 log2plus1_u64_u32f8(u64 v) {
-+	u64 burst_time = se->max_burst_time;
+	x32 result;
 +	int msb = fls64(v);
 +	result.u8[0] = v << (64 - msb) >> 55;
 +	result.u8[1] = msb;
 +	return result.u32;
 +}
 +
-+	int msb = fls64(burst_time);
+static inline u32 u8h_u32(u8 v) {
-+	fixed integer_part = msb << FIXED_SHIFT;
+	x32 result;
-+	fixed fractional_part = burst_time << (64 - msb) << 1 >> (64 - FIXED_SHIFT);
+	result.u8[1] = v;
-+	fixed greed = integer_part | fractional_part;
+	return result.u32;
 +}
 +
-+	fixed tolerance = sched_burst_penalty_offset << FIXED_SHIFT;
+static inline u32 calc_burst_penalty(struct sched_entity *se) {
-+	fixed penalty = max(0, (s32)greed - (s32)tolerance);
+	u32 greed, tolerance, penalty, scaled_penalty;
 +	fixed scaled_penalty = penalty * sched_burst_penalty_scale >> 10;
 +	
-+	u8 score = min(39U, scaled_penalty >> FIXED_SHIFT);
+	greed = log2plus1_u64_u32f8(se->burst_time);
-+	se->penalty_score = score;
+	tolerance = u8h_u32(sched_burst_penalty_offset);
 +	penalty = max(0, (s32)greed - (s32)tolerance);
 +	scaled_penalty = penalty * sched_burst_penalty_scale >> 10;
 +
 +	return min(MAX_BURST_PENALTY, scaled_penalty);
 +}
 +
 +static void update_burst_penalty(struct sched_entity *se) {
 +	se->curr_burst_penalty = calc_burst_penalty(se);
 +	se->burst_penalty = max(se->prev_burst_penalty, se->curr_burst_penalty);
 +}
 +
 +static inline u64 penalty_scale(u64 delta, struct sched_entity *se) {
-+	return mul_u64_u32_shr(delta, sched_prio_to_wmult[se->penalty_score], 22);
+	u8 score = ((x16*)&se->burst_penalty)->u8[1];
 +	return mul_u64_u32_shr(delta, sched_prio_to_wmult[score], 22);
 +}
 +
-+static inline u64 __binary_smooth(u64 new, u64 old, unsigned int smoothness) {
+static inline u32 binary_smooth(u32 new, u32 old) {
-+	return (new <= old)? new: (new + old * ((1 << smoothness) - 1)) >> smoothness;
+  return (new >= old)?
 +    old + ((new - old) >> sched_burst_smoothness_up):
 +    old - ((old - new) >> sched_burst_smoothness_down);
 +}
 +
-+void restart_burst(struct sched_entity *se) {
+static void restart_burst(struct sched_entity *se) {
-+	se->max_burst_time = se->prev_burst_time = __binary_smooth(
+	se->burst_penalty = se->prev_burst_penalty =
-+		se->burst_time, se->prev_burst_time, sched_burst_smoothness);
+		binary_smooth(se->curr_burst_penalty, se->prev_burst_penalty);
 +	se->curr_burst_penalty = 0;
 +	se->burst_time = 0;
 +}
 +
@ -358,7 +403,7 @@ index d6042543c..e52c14232 100644
 int sched_thermal_decay_shift;
 static int __init setup_sched_thermal_decay_shift(char *str)
 {
-@@ -145,6 +216,60 @@ static unsigned int sysctl_numa_balancing_promote_rate_limit = 65536;
+@@ -145,6 +233,69 @@ static unsigned int sysctl_numa_balancing_promote_rate_limit = 65536;
 #ifdef CONFIG_SYSCTL
 static struct ctl_table sched_fair_sysctls[] = {
@ -407,8 +452,17 @@ index d6042543c..e52c14232 100644
 +		.extra2		= &maxval_12_bits,
 +	},
 +	{
-+		.procname	= "sched_burst_smoothness",
+		.procname	= "sched_burst_smoothness_down",
-+		.data		= &sched_burst_smoothness,
+		.data		= &sched_burst_smoothness_down,
 +		.maxlen		= sizeof(unsigned int),
 +		.mode		= 0644,
 +		.proc_handler	= &proc_dointvec_minmax,
 +		.extra1		= SYSCTL_ZERO,
 +		.extra2		= &three,
 +	},
 +	{
 +		.procname	= "sched_burst_smoothness_up",
 +		.data		= &sched_burst_smoothness_up,
 +		.maxlen		= sizeof(unsigned int),
 +		.mode		= 0644,
 +		.proc_handler	= &proc_dointvec_minmax,
@ -419,7 +473,7 @@ index d6042543c..e52c14232 100644
 	{
 		.procname       = "sched_child_runs_first",
 		.data           = &sysctl_sched_child_runs_first,
-@@ -238,6 +363,7 @@ static void update_sysctl(void)
+@@ -238,6 +389,7 @@ static void update_sysctl(void)
 #define SET_SYSCTL(name) \
 	(sysctl_##name = (factor) * normalized_sysctl_##name)
 	SET_SYSCTL(sched_base_slice);
@ -427,7 +481,7 @@ index d6042543c..e52c14232 100644
 #undef SET_SYSCTL
 }
-@@ -308,11 +434,19 @@ static u64 __calc_delta(u64 delta_exec, unsigned long weight, struct load_weight
+@@ -308,11 +460,19 @@ static u64 __calc_delta(u64 delta_exec, unsigned long weight, struct load_weight
 /*
  * delta /= w
  */
@ -447,7 +501,7 @@ index d6042543c..e52c14232 100644
 	return delta;
 }
-@@ -708,7 +842,11 @@ void update_entity_lag(struct cfs_rq *cfs_rq, struct sched_entity *se)
+@@ -706,7 +866,11 @@ void update_entity_lag(struct cfs_rq *cfs_rq, struct sched_entity *se)
 	SCHED_WARN_ON(!se->on_rq);
 	lag = avg_vruntime(cfs_rq) - se->vruntime;
@ -459,7 +513,7 @@ index d6042543c..e52c14232 100644
 	se->vlag = clamp(lag, -limit, limit);
 }
-@@ -946,6 +1084,7 @@ int sched_update_scaling(void)
+@@ -944,6 +1108,7 @@ int sched_update_scaling(void)
 #define WRT_SYSCTL(name) \
 	(normalized_sysctl_##name = sysctl_##name / (factor))
 	WRT_SYSCTL(sched_base_slice);
@ -467,19 +521,18 @@ index d6042543c..e52c14232 100644
 #undef WRT_SYSCTL
 	return 0;
-@@ -1123,6 +1262,11 @@ static void update_curr(struct cfs_rq *cfs_rq)
+@@ -1121,6 +1286,10 @@ static void update_curr(struct cfs_rq *cfs_rq)
 	curr->sum_exec_runtime += delta_exec;
 	schedstat_add(cfs_rq->exec_clock, delta_exec);
 +#ifdef CONFIG_SCHED_BORE
 +	curr->burst_time += delta_exec;
-+	curr->max_burst_time = max(curr->max_burst_time, curr->burst_time);
+	update_burst_penalty(curr);
 +	update_burst_score(curr);
 +#endif // CONFIG_SCHED_BORE
 	curr->vruntime += calc_delta_fair(delta_exec, curr);
 	update_deadline(cfs_rq, curr);
 	update_min_vruntime(cfs_rq);
-@@ -5237,6 +5381,9 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
+@@ -5187,6 +5356,9 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
 	se->prev_sum_exec_runtime = se->sum_exec_runtime;
 }
@ -489,7 +542,7 @@ index d6042543c..e52c14232 100644
 /*
  * Pick the next process, keeping these things in mind, in this order:
  * 1) keep things fair between processes/task groups
-@@ -5247,14 +5394,16 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
+@@ -5197,14 +5369,16 @@ set_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *se)
 static struct sched_entity *
 pick_next_entity(struct cfs_rq *cfs_rq, struct sched_entity *curr)
 {
@ -508,7 +561,7 @@ index d6042543c..e52c14232 100644
 }
 static bool check_cfs_rq_runtime(struct cfs_rq *cfs_rq);
-@@ -6522,6 +6671,38 @@ enqueue_task_fair(struct rq *rq, struct task_struct *p, int flags)
+@@ -6452,6 +6626,38 @@ enqueue_task_fair(struct rq *rq, struct task_struct *p, int flags)
 	hrtick_update(rq);
 }
@ -547,7 +600,7 @@ index d6042543c..e52c14232 100644
 static void set_next_buddy(struct sched_entity *se);
 /*
-@@ -6540,6 +6721,9 @@ static void dequeue_task_fair(struct rq *rq, struct task_struct *p, int flags)
+@@ -6470,6 +6676,9 @@ static void dequeue_task_fair(struct rq *rq, struct task_struct *p, int flags)
 	util_est_dequeue(&rq->cfs, p);
 	for_each_sched_entity(se) {
@ -557,7 +610,7 @@ index d6042543c..e52c14232 100644
 		cfs_rq = cfs_rq_of(se);
 		dequeue_entity(cfs_rq, se, flags);
-@@ -8047,7 +8231,7 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
+@@ -7980,7 +8189,7 @@ static void check_preempt_wakeup(struct rq *rq, struct task_struct *p, int wake_
 	/*
 	 * XXX pick_eevdf(cfs_rq) != se ?
 	 */
@ -566,7 +619,7 @@ index d6042543c..e52c14232 100644
 		goto preempt;
 	return;
-@@ -8260,6 +8444,9 @@ static void yield_task_fair(struct rq *rq)
+@@ -8193,6 +8402,9 @@ static void yield_task_fair(struct rq *rq)
 	struct task_struct *curr = rq->curr;
 	struct cfs_rq *cfs_rq = task_cfs_rq(curr);
 	struct sched_entity *se = &curr->se;
@ -577,10 +630,10 @@ index d6042543c..e52c14232 100644
 	/*
 	 * Are we the only task in the tree?
 diff --git a/kernel/sched/features.h b/kernel/sched/features.h
-index 7d65b4029..bd274f7c7 100644
+index 54334ca5c5c6..416ec4bcdb0f 100644
 --- a/kernel/sched/features.h
 +++ b/kernel/sched/features.h
-@@ -13,7 +13,11 @@ SCHED_FEAT(PLACE_DEADLINE_INITIAL, true)
+@@ -12,7 +12,11 @@ SCHED_FEAT(PLACE_DEADLINE_INITIAL, true)
  * wakeup-preemption), since its likely going to consume data we
  * touched, increases cache locality.
  */
@ -593,10 +646,10 @@ index 7d65b4029..bd274f7c7 100644
 /*
  * Consider buddies to be cache hot, decreases the likeliness of a
 diff --git a/kernel/sched/sched.h b/kernel/sched/sched.h
-index 4236c4c89..714cc6ad9 100644
+index 67cd7e1fd501..04d065015d6c 100644
 --- a/kernel/sched/sched.h
 +++ b/kernel/sched/sched.h
-@@ -2510,6 +2510,7 @@ extern const_debug unsigned int sysctl_sched_nr_migrate;
+@@ -2506,6 +2506,7 @@ extern const_debug unsigned int sysctl_sched_nr_migrate;
 extern const_debug unsigned int sysctl_sched_migration_cost;
 extern unsigned int sysctl_sched_base_slice;
@ -605,4 +658,4 @@ index 4236c4c89..714cc6ad9 100644
 #ifdef CONFIG_SCHED_DEBUG
 extern int sysctl_resched_latency_warn_ms;
 -- 
-2.41.0.159.g0bfa463d37
+2.41.0
--- a/patches/0006-AMD-cppc.patch
+++ b/patches/0006-AMD-cppc.patch
@ -0,0 +1,573 @@
 From ab6268d199fa749e274a48b00c443538ae492b16 Mon Sep 17 00:00:00 2001
 From: Piotr Gorski <lucjan.lucjanov@gmail.com>
 Date: Wed, 9 Aug 2023 14:07:31 +0200
 Subject: [PATCH] amd-6.5: merge changes from dev tree
 Signed-off-by: Piotr Gorski <lucjan.lucjanov@gmail.com>
 ---
 .../admin-guide/kernel-parameters.txt         |   5 +
 Documentation/admin-guide/pm/amd-pstate.rst   |  55 +++++
 drivers/acpi/cppc_acpi.c                      |  13 ++
 drivers/acpi/processor_driver.c               |   6 +
 drivers/cpufreq/amd-pstate.c                  | 191 ++++++++++++++++--
 drivers/cpufreq/cpufreq.c                     |  13 ++
 include/acpi/cppc_acpi.h                      |   5 +
 include/linux/amd-pstate.h                    |   1 +
 include/linux/cpufreq.h                       |   4 +
 9 files changed, 272 insertions(+), 21 deletions(-)
 diff --git a/Documentation/admin-guide/kernel-parameters.txt b/Documentation/admin-guide/kernel-parameters.txt
 index a1457995f..1f53c395a 100644
 --- a/Documentation/admin-guide/kernel-parameters.txt
 +++ b/Documentation/admin-guide/kernel-parameters.txt
@@ -363,6 +363,11 @@
 			  selects a performance level in this range and appropriate
 			  to the current workload.
 +	amd_prefcore=
 +			[X86]
 +			enable
 +			  Enable AMD Pstate Preferred Core.
 +
 	amijoy.map=	[HW,JOY] Amiga joystick support
 			Map of devices attached to JOY0DAT and JOY1DAT
 			Format: <a>,<b>
 diff --git a/Documentation/admin-guide/pm/amd-pstate.rst b/Documentation/admin-guide/pm/amd-pstate.rst
 index 1cf40f692..4a30cf235 100644
 --- a/Documentation/admin-guide/pm/amd-pstate.rst
 +++ b/Documentation/admin-guide/pm/amd-pstate.rst
@@ -353,6 +353,49 @@ is activated.  In this mode, driver requests minimum and maximum performance
 level and the platform autonomously selects a performance level in this range
 and appropriate to the current workload.
 +AMD Pstate Preferred Core
 +=================================
 +
 +The core frequency is subjected to the process variation in semiconductors.
 +Not all cores are able to reach the maximum frequency respecting the
 +infrastructure limits. Consequently, AMD has redefined the concept of
 +maximum frequency of a part. This means that a fraction of cores can reach
 +maximum frequency. To find the best process scheduling policy for a given
 +scenario, the OS needs to know the core ordering reported by the platform through
 +the highest performance capability register of the CPPC interface.
 +
 +``AMD Pstate Preferred Core`` uses the functions and data structures provided by
 +the ITMT architecture to let the scheduler favor cores that can reach a higher
 +frequency at a lower voltage. It can also dynamically change the preferred core
 +based on the workload and platform conditions, accounting for thermals and
 +aging.
 +
 +The priority metric will be initialized by the AMD Pstate driver. The AMD Pstate
 +driver will also determine whether or not ``AMD Pstate Preferred Core`` is
 +supported by the platform.
 +
 +The AMD Pstate driver will provide an initial core ordering when the system boots.
 +The platform uses the CPPC interfaces to communicate the core ranking to the
 +operating system and scheduler, so that the OS chooses the cores with the
 +highest performance first when scheduling processes. When the AMD Pstate
 +driver receives a notification that the highest performance has changed, it
 +updates the core ranking and sets the CPU's priority.
 +
 +AMD Preferred Core Switch
 +=================================
 +Kernel Parameters
 +-----------------
 +
 +``AMD Pstate Preferred Core`` has two states: enable and disable.
 +Enable/disable states can be chosen by different kernel parameters.
 +``AMD Pstate Preferred Core`` is disabled by default.
 +
 +``amd_prefcore=enable``
 +
 +If ``amd_prefcore=enable`` is passed on the kernel command line, then
 +``AMD Pstate Preferred Core`` is enabled, provided that the processor and
 +power firmware support the preferred core feature.
 +
 User Space Interface in ``sysfs`` - General
 ===========================================
@@ -385,6 +428,18 @@ control its functionality at the system level.  They are located in the
         to the operation mode represented by that string - or to be
         unregistered in the "disable" case.
 +``prefcore_state``
 +	Preferred Core state of the driver: "enabled" or "disabled".
 +
 +	"enabled"
 +		AMD Preferred Core is enabled.
 +
 +	"disabled"
 +		AMD Preferred Core is disabled.
 +
 +
 +        This attribute is read-only to check the state of Preferred Core.
 +
 ``cpupower`` tool support for ``amd-pstate``
 ===============================================
 diff --git a/drivers/acpi/cppc_acpi.c b/drivers/acpi/cppc_acpi.c
 index 7ff269a78..ad388a0e8 100644
 --- a/drivers/acpi/cppc_acpi.c
 +++ b/drivers/acpi/cppc_acpi.c
@@ -1154,6 +1154,19 @@ int cppc_get_nominal_perf(int cpunum, u64 *nominal_perf)
 	return cppc_get_perf(cpunum, NOMINAL_PERF, nominal_perf);
 }
 +/**
 + * cppc_get_highest_perf - Get the highest performance register value.
 + * @cpunum: CPU from which to get highest performance.
 + * @highest_perf: Return address.
 + *
 + * Return: 0 for success, -EIO otherwise.
 + */
 +int cppc_get_highest_perf(int cpunum, u64 *highest_perf)
 +{
 +	return cppc_get_perf(cpunum, HIGHEST_PERF, highest_perf);
 +}
 +EXPORT_SYMBOL_GPL(cppc_get_highest_perf);
 +
 /**
  * cppc_get_epp_perf - Get the epp register value.
  * @cpunum: CPU from which to get epp preference value.
 diff --git a/drivers/acpi/processor_driver.c b/drivers/acpi/processor_driver.c
 index 4bd16b3f0..29b2fb68a 100644
 --- a/drivers/acpi/processor_driver.c
 +++ b/drivers/acpi/processor_driver.c
@@ -27,6 +27,7 @@
 #define ACPI_PROCESSOR_NOTIFY_PERFORMANCE 0x80
 #define ACPI_PROCESSOR_NOTIFY_POWER	0x81
 #define ACPI_PROCESSOR_NOTIFY_THROTTLING	0x82
 +#define ACPI_PROCESSOR_NOTIFY_HIGEST_PERF_CHANGED	0x85
 MODULE_AUTHOR("Paul Diefenbaugh");
 MODULE_DESCRIPTION("ACPI Processor Driver");
@@ -83,6 +84,11 @@ static void acpi_processor_notify(acpi_handle handle, u32 event, void *data)
 		acpi_bus_generate_netlink_event(device->pnp.device_class,
 						  dev_name(&device->dev), event, 0);
 		break;
 +	case ACPI_PROCESSOR_NOTIFY_HIGEST_PERF_CHANGED:
 +		cpufreq_update_highest_perf(pr->id);
 +		acpi_bus_generate_netlink_event(device->pnp.device_class,
 +						  dev_name(&device->dev), event, 0);
 +		break;
 	default:
 		acpi_handle_debug(handle, "Unsupported event [0x%x]\n", event);
 		break;
 diff --git a/drivers/cpufreq/amd-pstate.c b/drivers/cpufreq/amd-pstate.c
 index 81fba0dcb..ba10aa971 100644
 --- a/drivers/cpufreq/amd-pstate.c
 +++ b/drivers/cpufreq/amd-pstate.c
@@ -37,6 +37,7 @@
 #include <linux/uaccess.h>
 #include <linux/static_call.h>
 #include <linux/amd-pstate.h>
 +#include <linux/topology.h>
 #include <acpi/processor.h>
 #include <acpi/cppc_acpi.h>
@@ -49,6 +50,8 @@
 #define AMD_PSTATE_TRANSITION_LATENCY	20000
 #define AMD_PSTATE_TRANSITION_DELAY	1000
 +#define AMD_PSTATE_PREFCORE_THRESHOLD	166
 +#define AMD_PSTATE_MAX_CPPC_PERF	255
 /*
  * TODO: We need more time to fine tune processors with shared memory solution
@@ -65,6 +68,14 @@ static struct cpufreq_driver amd_pstate_epp_driver;
 static int cppc_state = AMD_PSTATE_UNDEFINED;
 static bool cppc_enabled;
 +/*
 + * CPPC Preferred Core feature is supported by power firmware
 + */
 +static bool prefcore_enabled = false;
 +
 +/* Disable AMD Pstate Preferred Core loading */
 +static bool no_prefcore __read_mostly = true;
 +
 /*
  * AMD Energy Preference Performance (EPP)
  * The EPP is used in the CCLK DPM controller to drive
@@ -290,27 +301,26 @@ static inline int amd_pstate_enable(bool enable)
 static int pstate_init_perf(struct amd_cpudata *cpudata)
 {
 	u64 cap1;
 -	u32 highest_perf;
 	int ret = rdmsrl_safe_on_cpu(cpudata->cpu, MSR_AMD_CPPC_CAP1,
 				     &cap1);
 	if (ret)
 		return ret;
 -	/*
 -	 * TODO: Introduce AMD specific power feature.
 -	 *
 -	 * CPPC entry doesn't indicate the highest performance in some ASICs.
 +	/* For platforms that do not support the preferred core feature, the
 +	 * highest_perf may be configured with 166 or 255. To avoid calculating
 +	 * the max frequency wrongly, we take the AMD_CPPC_HIGHEST_PERF(cap1)
 +	 * value as the default max perf.
 	 */
 -	highest_perf = amd_get_highest_perf();
 -	if (highest_perf > AMD_CPPC_HIGHEST_PERF(cap1))
 -		highest_perf = AMD_CPPC_HIGHEST_PERF(cap1);
 -
 -	WRITE_ONCE(cpudata->highest_perf, highest_perf);
 +	if (!prefcore_enabled)
 +		WRITE_ONCE(cpudata->highest_perf, AMD_CPPC_HIGHEST_PERF(cap1));
 +	else
 +		WRITE_ONCE(cpudata->highest_perf, AMD_PSTATE_PREFCORE_THRESHOLD);
 	WRITE_ONCE(cpudata->nominal_perf, AMD_CPPC_NOMINAL_PERF(cap1));
 	WRITE_ONCE(cpudata->lowest_nonlinear_perf, AMD_CPPC_LOWNONLIN_PERF(cap1));
 	WRITE_ONCE(cpudata->lowest_perf, AMD_CPPC_LOWEST_PERF(cap1));
 +	WRITE_ONCE(cpudata->prefcore_highest_perf, AMD_CPPC_HIGHEST_PERF(cap1));
 	return 0;
 }
@@ -318,22 +328,21 @@ static int pstate_init_perf(struct amd_cpudata *cpudata)
 static int cppc_init_perf(struct amd_cpudata *cpudata)
 {
 	struct cppc_perf_caps cppc_perf;
 -	u32 highest_perf;
 	int ret = cppc_get_perf_caps(cpudata->cpu, &cppc_perf);
 	if (ret)
 		return ret;
 -	highest_perf = amd_get_highest_perf();
 -	if (highest_perf > cppc_perf.highest_perf)
 -		highest_perf = cppc_perf.highest_perf;
 -
 -	WRITE_ONCE(cpudata->highest_perf, highest_perf);
 +	if (!prefcore_enabled)
 +		WRITE_ONCE(cpudata->highest_perf, cppc_perf.highest_perf);
 +	else
 +		WRITE_ONCE(cpudata->highest_perf, AMD_PSTATE_PREFCORE_THRESHOLD);
 	WRITE_ONCE(cpudata->nominal_perf, cppc_perf.nominal_perf);
 	WRITE_ONCE(cpudata->lowest_nonlinear_perf,
 		   cppc_perf.lowest_nonlinear_perf);
 	WRITE_ONCE(cpudata->lowest_perf, cppc_perf.lowest_perf);
 +	WRITE_ONCE(cpudata->prefcore_highest_perf, cppc_perf.highest_perf);
 	if (cppc_state == AMD_PSTATE_ACTIVE)
 		return 0;
@@ -676,6 +685,118 @@ static void amd_perf_ctl_reset(unsigned int cpu)
 	wrmsrl_on_cpu(cpu, MSR_AMD_PERF_CTL, 0);
 }
 +/*
 + * Enabling ITMT scheduling support cannot be done directly from cpufreq
 + * callbacks due to locking, so it is deferred to a work item.
 + */
 +static void amd_pstate_sched_prefcore_workfn(struct work_struct *work)
 +{
 +	sched_set_itmt_support();
 +}
 +static DECLARE_WORK(sched_prefcore_work, amd_pstate_sched_prefcore_workfn);
 +
 +/**
 + * amd_pstate_get_highest_perf - Get the highest performance register value.
 + * @cpu: CPU from which to get highest performance.
 + * @highest_perf: Where the value is stored.
 + *
 + * Return: 0 on success, or the error code from the MSR or ACPI CPPC read.
 + */
 +static int amd_pstate_get_highest_perf(int cpu, u64 *highest_perf)
 +{
 +	int ret;
 +
 +	if (boot_cpu_has(X86_FEATURE_CPPC)) {
 +		u64 cap1;
 +
 +		ret = rdmsrl_safe_on_cpu(cpu, MSR_AMD_CPPC_CAP1, &cap1);
 +		if (ret)
 +			return ret;
 +		WRITE_ONCE(*highest_perf, AMD_CPPC_HIGHEST_PERF(cap1));
 +	} else {
 +		ret = cppc_get_highest_perf(cpu, highest_perf);
 +	}
 +
 +	return ret;
 +}
 +
 +/* Publish each CPU's highest perf as its ITMT priority, then enable ITMT. */
 +static void amd_pstate_init_prefcore(void)
 +{
 +	u64 highest_perf;
 +	int cpu;
 +
 +	/* Only rank cores when the user opted in and prefcore was detected. */
 +	if (no_prefcore || !prefcore_enabled)
 +		return;
 +
 +	for_each_possible_cpu(cpu) {
 +		/* Never enable ITMT on top of an incomplete priority table. */
 +		if (amd_pstate_get_highest_perf(cpu, &highest_perf))
 +			return;
 +
 +		sched_set_itmt_core_prio(highest_perf, cpu);
 +	}
 +
 +	/*
 +	 * sched_set_itmt_support() is not called directly from here; it is
 +	 * deferred to the sched_prefcore_work work item.
 +	 */
 +	schedule_work(&sched_prefcore_work);
 +}
 +
 +/* Re-read @cpu's highest perf and update its ITMT priority if it changed. */
 +static void amd_pstate_update_highest_perf(unsigned int cpu)
 +{
 +	struct cpufreq_policy *policy;
 +	struct amd_cpudata *cpudata;
 +	u32 prev_high, cur_high;
 +	u64 highest_perf;
 +
 +	if (!prefcore_enabled ||
 +	    amd_pstate_get_highest_perf(cpu, &highest_perf))
 +		return;
 +
 +	/* cpufreq_cpu_get() returns NULL if @cpu has no usable policy. */
 +	policy = cpufreq_cpu_get(cpu);
 +	if (!policy)
 +		return;
 +
 +	cpudata = policy->driver_data;
 +	cur_high = highest_perf;
 +	prev_high = READ_ONCE(cpudata->prefcore_highest_perf);
 +	if (prev_high != cur_high) {
 +		WRITE_ONCE(cpudata->prefcore_highest_perf, cur_high);
 +		sched_set_itmt_core_prio(cur_high, cpu);
 +	}
 +
 +	cpufreq_cpu_put(policy);
 +}
 +
 +/*
 + * Latch prefcore_enabled when @cpu reports a preferred-core highest perf.
 + *
 + * Nothing is probed while no_prefcore is set; it defaults to true and is
 + * cleared by booting with "amd_prefcore=enable". Otherwise prefcore_enabled
 + * becomes true once the highest perf read for @cpu is below
 + * AMD_PSTATE_MAX_CPPC_PERF. This function never resets it to false.
 + */
 +static void check_prefcore_supported(int cpu)
 +{
 +	u64 max_perf;
 +
 +	if (no_prefcore)
 +		return;
 +
 +	if (amd_pstate_get_highest_perf(cpu, &max_perf))
 +		return;
 +
 +	if (max_perf >= AMD_PSTATE_MAX_CPPC_PERF)
 +		return;
 +
 +	prefcore_enabled = true;
 +}
 +
 static int amd_pstate_cpu_init(struct cpufreq_policy *policy)
 {
 	int min_freq, max_freq, nominal_freq, lowest_nonlinear_freq, ret;
@@ -697,6 +818,9 @@ static int amd_pstate_cpu_init(struct cpufreq_policy *policy)
 	cpudata->cpu = policy->cpu;
 +	/* Check if the CPPC preferred core feature is enabled */
 +	check_prefcore_supported(policy->cpu);
 +
 	ret = amd_pstate_init_perf(cpudata);
 	if (ret)
 		goto free_cpudata1;
@@ -1012,8 +1136,8 @@ static int amd_pstate_update_status(const char *buf, size_t size)
 	return 0;
 }
 -static ssize_t show_status(struct kobject *kobj,
 -			   struct kobj_attribute *attr, char *buf)
 +static ssize_t status_show(struct device *dev,
 +			   struct device_attribute *attr, char *buf)
 {
 	ssize_t ret;
@@ -1024,7 +1148,7 @@ static ssize_t show_status(struct kobject *kobj,
 	return ret;
 }
 -static ssize_t store_status(struct kobject *a, struct kobj_attribute *b,
 +static ssize_t status_store(struct device *a, struct device_attribute *b,
 			    const char *buf, size_t count)
 {
 	char *p = memchr(buf, '\n', count);
@@ -1037,13 +1161,20 @@ static ssize_t store_status(struct kobject *a, struct kobj_attribute *b,
 	return ret < 0 ? ret : count;
 }
 +/* sysfs show handler: emits "enabled" or "disabled" per prefcore_enabled. */
 +static ssize_t prefcore_state_show(struct device *dev,
 +				   struct device_attribute *attr, char *buf)
 +{
 +	const char *state = prefcore_enabled ? "enabled" : "disabled";
 +
 +	return sysfs_emit(buf, "%s\n", state);
 +}
 +
 cpufreq_freq_attr_ro(amd_pstate_max_freq);
 cpufreq_freq_attr_ro(amd_pstate_lowest_nonlinear_freq);
 cpufreq_freq_attr_ro(amd_pstate_highest_perf);
 cpufreq_freq_attr_rw(energy_performance_preference);
 cpufreq_freq_attr_ro(energy_performance_available_preferences);
 -define_one_global_rw(status);
 +static DEVICE_ATTR_RW(status);
 +static DEVICE_ATTR_RO(prefcore_state);
 static struct freq_attr *amd_pstate_attr[] = {
 	&amd_pstate_max_freq,
@@ -1062,7 +1193,8 @@ static struct freq_attr *amd_pstate_epp_attr[] = {
 };
 static struct attribute *pstate_global_attributes[] = {
 -	&status.attr,
 +	&dev_attr_status.attr,
 +	&dev_attr_prefcore_state.attr,
 	NULL
 };
@@ -1114,6 +1246,9 @@ static int amd_pstate_epp_cpu_init(struct cpufreq_policy *policy)
 	cpudata->cpu = policy->cpu;
 	cpudata->epp_policy = 0;
 +	/* Check if the CPPC preferred core feature is supported */
 +	check_prefcore_supported(policy->cpu);
 +
 	ret = amd_pstate_init_perf(cpudata);
 	if (ret)
 		goto free_cpudata1;
@@ -1392,6 +1527,7 @@ static struct cpufreq_driver amd_pstate_driver = {
 	.suspend	= amd_pstate_cpu_suspend,
 	.resume		= amd_pstate_cpu_resume,
 	.set_boost	= amd_pstate_set_boost,
 +	.update_highest_perf	= amd_pstate_update_highest_perf,
 	.name		= "amd-pstate",
 	.attr		= amd_pstate_attr,
 };
@@ -1406,6 +1542,7 @@ static struct cpufreq_driver amd_pstate_epp_driver = {
 	.online		= amd_pstate_epp_cpu_online,
 	.suspend	= amd_pstate_epp_suspend,
 	.resume		= amd_pstate_epp_resume,
 +	.update_highest_perf	= amd_pstate_update_highest_perf,
 	.name		= "amd-pstate-epp",
 	.attr		= amd_pstate_epp_attr,
 };
@@ -1506,6 +1643,8 @@ static int __init amd_pstate_init(void)
 		}
 	}
 +	amd_pstate_init_prefcore();
 +
 	return ret;
 global_attr_free:
@@ -1527,7 +1666,17 @@ static int __init amd_pstate_param(char *str)
 	return amd_pstate_set_driver(mode_idx);
 }
 +
 +/*
 + * Parse the "amd_prefcore=" boot option: "enable" clears no_prefcore, any
 + * other value leaves it unchanged.
 + */
 +static int __init amd_prefcore_param(char *str)
 +{
 +	/* A bare "amd_prefcore" with no "=value" arrives as a NULL string. */
 +	if (!str)
 +		return -EINVAL;
 +
 +	if (!strcmp(str, "enable"))
 +		no_prefcore = false;
 +
 +	return 0;
 +}
 +
 early_param("amd_pstate", amd_pstate_param);
 +early_param("amd_prefcore", amd_prefcore_param);
 MODULE_AUTHOR("Huang Rui <ray.huang@amd.com>");
 MODULE_DESCRIPTION("AMD Processor P-state Frequency Driver");
 diff --git a/drivers/cpufreq/cpufreq.c b/drivers/cpufreq/cpufreq.c
 index 50bbc969f..842357abf 100644
 --- a/drivers/cpufreq/cpufreq.c
 +++ b/drivers/cpufreq/cpufreq.c
@@ -2675,6 +2675,19 @@ void cpufreq_update_limits(unsigned int cpu)
 }
 EXPORT_SYMBOL_GPL(cpufreq_update_limits);
 +/**
 + * cpufreq_update_highest_perf - Refresh the highest performance of a CPU.
 + * @cpu: CPU whose highest performance should be refreshed.
 + *
 + * Forwards to the driver's ->update_highest_perf callback; does nothing when
 + * the driver does not provide one.
 + */
 +void cpufreq_update_highest_perf(unsigned int cpu)
 +{
 +	if (!cpufreq_driver->update_highest_perf)
 +		return;
 +
 +	cpufreq_driver->update_highest_perf(cpu);
 +}
 +EXPORT_SYMBOL_GPL(cpufreq_update_highest_perf);
 +
 /*********************************************************************
  *               BOOST						     *
  *********************************************************************/
 diff --git a/include/acpi/cppc_acpi.h b/include/acpi/cppc_acpi.h
 index 6126c977e..c0b69ffe7 100644
 --- a/include/acpi/cppc_acpi.h
 +++ b/include/acpi/cppc_acpi.h
@@ -139,6 +139,7 @@ struct cppc_cpudata {
 #ifdef CONFIG_ACPI_CPPC_LIB
 extern int cppc_get_desired_perf(int cpunum, u64 *desired_perf);
 extern int cppc_get_nominal_perf(int cpunum, u64 *nominal_perf);
 +extern int cppc_get_highest_perf(int cpunum, u64 *highest_perf);
 extern int cppc_get_perf_ctrs(int cpu, struct cppc_perf_fb_ctrs *perf_fb_ctrs);
 extern int cppc_set_perf(int cpu, struct cppc_perf_ctrls *perf_ctrls);
 extern int cppc_set_enable(int cpu, bool enable);
@@ -165,6 +166,10 @@ static inline int cppc_get_nominal_perf(int cpunum, u64 *nominal_perf)
 {
 	return -ENOTSUPP;
 }
 +/* Stub variant: reports -ENOTSUPP and leaves @highest_perf untouched. */
 +static inline int cppc_get_highest_perf(int cpunum, u64 *highest_perf)
 +{
 +	return -ENOTSUPP;
 +}
 static inline int cppc_get_perf_ctrs(int cpu, struct cppc_perf_fb_ctrs *perf_fb_ctrs)
 {
 	return -ENOTSUPP;
 diff --git a/include/linux/amd-pstate.h b/include/linux/amd-pstate.h
 index 446394f84..fa86bc953 100644
 --- a/include/linux/amd-pstate.h
 +++ b/include/linux/amd-pstate.h
@@ -70,6 +70,7 @@ struct amd_cpudata {
 	u32	nominal_perf;
 	u32	lowest_nonlinear_perf;
 	u32	lowest_perf;
 +	u32     prefcore_highest_perf;
 	u32	max_freq;
 	u32	min_freq;
 diff --git a/include/linux/cpufreq.h b/include/linux/cpufreq.h
 index 172ff51c1..766c83a4f 100644
 --- a/include/linux/cpufreq.h
 +++ b/include/linux/cpufreq.h
@@ -231,6 +231,7 @@ int cpufreq_get_policy(struct cpufreq_policy *policy, unsigned int cpu);
 void refresh_frequency_limits(struct cpufreq_policy *policy);
 void cpufreq_update_policy(unsigned int cpu);
 void cpufreq_update_limits(unsigned int cpu);
 +void cpufreq_update_highest_perf(unsigned int cpu);
 bool have_governor_per_policy(void);
 bool cpufreq_supports_freq_invariance(void);
 struct kobject *get_governor_parent_kobj(struct cpufreq_policy *policy);
@@ -376,6 +377,9 @@ struct cpufreq_driver {
 	/* Called to update policy limits on firmware notifications. */
 	void		(*update_limits)(unsigned int cpu);
 +	/* Called to update highest performance on firmware notifications. */
 +	void		(*update_highest_perf)(unsigned int cpu);
 +
 	/* optional */
 	int		(*bios_limit)(int cpu, unsigned int *limit);
 -- 
 2.42.0.rc0.25.ga82fb66fed
--- a/scripts/patch.sh
+++ b/scripts/patch.sh
@ -16,3 +16,5 @@ patch -Np1 < "../patches/0002-eevdfbore.patch"
 patch -Np1 < "../patches/0004-Allow-to-set-custom-USB-pollrate-for-specific-device.patch"
 # Allow pre polaris cards to use the amdgpu kernel module
 patch -Np1 < "../patches/0005-amdgpu-si-cik-default.patch"
 # AMD Patch for CPPC
 patch -Np1 < "../patches/0006-AMD-cppc.patch"
--- a/scripts/source.sh
+++ b/scripts/source.sh
@ -2,7 +2,7 @@
 echo "Pika Kernel - Getting source"
-wget -nv https://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git/snapshot/linux-6.5-rc3.tar.gz
+wget -nv https://git.kernel.org/pub/scm/linux/kernel/git/torvalds/linux.git/snapshot/linux-6.5-rc5.tar.gz
-tar -xf ./linux-6.5-rc3.tar.gz
+tar -xf ./linux-6.5-rc5.tar.gz
-cd linux-6.5-rc3
+cd linux-6.5-rc5