diff options
| author | Davide Garberi <dade.garberi@gmail.com> | 2023-08-06 15:31:30 +0200 | 
|---|---|---|
| committer | Davide Garberi <dade.garberi@gmail.com> | 2023-08-06 15:31:30 +0200 | 
| commit | cc57cb4ee3b7918b74d30604735d353b9a5fa23b (patch) | |
| tree | 0be483b86472eaf1c74f747ecbaf6300f3998a1a /kernel/sched/core.c | |
| parent | 44be99a74546fb018cbf2049602a5fd2889a0089 (diff) | |
| parent | 7d11b1a7a11c598a07687f853ded9eca97d89043 (diff) | |
Merge lineage-20 of git@github.com:LineageOS/android_kernel_qcom_msm8998.git into lineage-20
7d11b1a7a11c Revert "sched: cpufreq: Use sched_clock instead of rq_clock when updating schedutil"
daaa5da96a74 sched: Take irq_sparse lock during the isolation
217ab2d0ef91 rcu: Speed up calling of RCU tasks callbacks
997b726bc092 kernel: power: Workaround for sensor ipc message causing high power consume
b933e4d37bc0 sched/fair: Fix low cpu usage with high throttling by removing expiration of cpu-local slices
82d3f23d6dc5 sched/fair: Fix bandwidth timer clock drift condition
629bfed360f9 kernel: power: qos: remove check for core isolation while cluster LPMs
891a63210e1d sched/fair: Fix issue where frequency update not skipped
b775cb29f663 ANDROID: Move schedtune en/dequeue before schedutil update triggers
ebdb82f7b34a sched/fair: Skip frequency updates if CPU about to idle
ff383d94478a FROMLIST: sched: Make iowait_boost optional in schedutil
9539942cb065 FROMLIST: cpufreq: Make iowait boost a policy option
b65c91c9aa14 ARM: dts: msm: add HW CPU's busy-cost-data for additional freqs
72f13941085b ARM: dts: msm: fix CPU's idle-cost-data
ab88411382f7 ARM: dts: msm: fix EM to be monotonically increasing
83dcbae14782 ARM: dts: msm: Fix EAS idle-cost-data property length
33d3b17bfdfb ARM: dts: msm: Add msm8998 energy model
c0fa7577022c sched/walt: Re-add code to allow WALT to function
d5cd35f38616 FROMGIT: binder: use EINTR for interrupted wait for work
db74739c86de sched: Don't fail isolation request for an already isolated CPU
aee7a16e347b sched: WALT: increase WALT minimum window size to 20ms
4dbe44554792 sched: cpufreq: Use per_cpu_ptr instead of this_cpu_ptr when reporting load
ef3fb04c7df4 sched: cpufreq: Use sched_clock instead of rq_clock when updating schedutil
c7128748614a sched/cpupri: Exclude isolated CPUs from the lowest_mask
6adb092856e8 sched: cpufreq: Limit governor updates to WALT changes alone
0fa652ee00f5 sched: walt: Correct WALT window size initialization
41cbb7bc59fb sched: walt: fix window misalignment when HZ=300
43cbf9d6153d sched/tune: Increase the cgroup limit to 6
c71b8fffe6b3 drivers: cpuidle: lpm-levels: Fix KW issues with idle state idx < 0
938e42ca699f drivers: cpuidle: lpm-levels: Correctly check for list empty
8d8a48aecde5 sched/fair: Fix load_balance() affinity redo path
eccc8acbe705 sched/fair: Avoid unnecessary active load balance
0ffdb886996b BACKPORT: sched/core: Fix rules for running on online && !active CPUs
c9999f04236e sched/core: Allow kthreads to fall back to online && !active cpus
b9b6bc6ea3c0 sched: Allow migrating kthreads into online but inactive CPUs
a9314f9d8ad4 sched/fair: Allow load bigger task load balance when nr_running is 2
c0b317c27d44 pinctrl: qcom: Clear status bit on irq_unmask
45df1516d04a UPSTREAM: mm: fix misplaced unlock_page in do_wp_page()
899def5edcd4 UPSTREAM: mm/ksm: Remove reuse_ksm_page()
46c6fbdd185a BACKPORT: mm: do_wp_page() simplification
90dccbae4c04 UPSTREAM: mm: reuse only-pte-mapped KSM page in do_wp_page()
ebf270d24640 sched/fair: vruntime should normalize when switching from  fair
cbe0b37059c9 mm: introduce arg_lock to protect arg_start|end and  env_start|end in mm_struct
12d40f1995b4 msm: mdss: Fix indentation
620df03a7229 msm: mdss: Treat polling_en as the bool that it is
12af218146a6 msm: mdss: add idle state node
13e661759656 cpuset: Restore tasks affinity while moving across cpusets
602bf4096dab genirq: Honour IRQ's affinity hint during migration
9209b5556f6a power: qos: Use effective affinity mask
f31078b5825f genirq: Introduce effective affinity mask
58c453484f7e sched/cputime: Mitigate performance regression in times()/clock_gettime()
400383059868 kernel: time: Add delay after cpu_relax() in tight loops
1daa7ea39076 pinctrl: qcom: Update irq handle for GPIO pins
07f7c9961c7c power: smb-lib: Fix mutex acquisition deadlock on PD hard reset
094b738f46c8 power: qpnp-smb2: Implement battery charging_enabled node
d6038d6da57f ASoC: msm-pcm-q6-v2: Add dsp buf check
0d7a6c301af8 qcacld-3.0: Fix OOB in wma_scan_roam.c
Change-Id: Ia2e189e37daad6e99bdb359d1204d9133a7916f4
Diffstat (limited to 'kernel/sched/core.c')
| -rw-r--r-- | kernel/sched/core.c | 100 | 
1 files changed, 87 insertions, 13 deletions
| diff --git a/kernel/sched/core.c b/kernel/sched/core.c index 40a44876c74c..a8d2c50737ee 100644 --- a/kernel/sched/core.c +++ b/kernel/sched/core.c @@ -78,6 +78,7 @@  #include <linux/irq.h>  #include <linux/sched/core_ctl.h>  #include <linux/cpufreq_times.h> +#include <linux/prefetch.h>  #include <asm/switch_to.h>  #include <asm/tlb.h> @@ -97,6 +98,7 @@  #define CREATE_TRACE_POINTS  #include <trace/events/sched.h> +#include "walt.h"  ATOMIC_NOTIFIER_HEAD(load_alert_notifier_head); @@ -1084,6 +1086,33 @@ void check_preempt_curr(struct rq *rq, struct task_struct *p, int flags)  }  #ifdef CONFIG_SMP + +static inline bool is_per_cpu_kthread(struct task_struct *p) +{ +	if (!(p->flags & PF_KTHREAD)) +		return false; + +	if (p->nr_cpus_allowed != 1) +		return false; + +	return true; +} + +/* + * Per-CPU kthreads are allowed to run on !actie && online CPUs, see + * __set_cpus_allowed_ptr() and select_fallback_rq(). + */ +static inline bool is_cpu_allowed(struct task_struct *p, int cpu) +{ +	if (!cpumask_test_cpu(cpu, &p->cpus_allowed)) +		return false; + +	if (is_per_cpu_kthread(p)) +		return cpu_online(cpu); + +	return cpu_active(cpu); +} +  /*   * This is how migration works:   * @@ -1143,11 +1172,8 @@ static struct rq *__migrate_task(struct rq *rq, struct task_struct *p, int dest_  {  	int src_cpu; -	if (unlikely(!cpu_active(dest_cpu))) -		return rq; -  	/* Affinity changed (again). */ -	if (!cpumask_test_cpu(dest_cpu, tsk_cpus_allowed(p))) +	if (!is_cpu_allowed(p, dest_cpu))  		return rq;  	src_cpu = cpu_of(rq); @@ -1364,6 +1390,7 @@ void set_task_cpu(struct task_struct *p, unsigned int new_cpu)  		p->se.nr_migrations++;  		perf_event_task_migrate(p); +		walt_fixup_busy_time(p, new_cpu);  		fixup_busy_time(p, new_cpu);  	} @@ -1648,9 +1675,7 @@ static int select_fallback_rq(int cpu, struct task_struct *p, bool allow_iso)  	for (;;) {  		/* Any allowed, online CPU? */  		for_each_cpu(dest_cpu, tsk_cpus_allowed(p)) { -			if (!cpu_online(dest_cpu)) -				continue; -			if (!cpu_active(dest_cpu)) +			if (!is_cpu_allowed(p, dest_cpu))  				continue;  			if (cpu_isolated(dest_cpu)) {  				if (allow_iso) @@ -2132,6 +2157,9 @@ try_to_wake_up(struct task_struct *p, unsigned int state, int wake_flags,  	raw_spin_lock(&rq->lock);  	old_load = task_load(p); +	wallclock = walt_ktime_clock(); +	walt_update_task_ravg(rq->curr, rq, TASK_UPDATE, wallclock, 0); +	walt_update_task_ravg(p, rq, TASK_WAKE, wallclock, 0);  	wallclock = sched_ktime_clock();  	update_task_ravg(rq->curr, rq, TASK_UPDATE, wallclock, 0);  	update_task_ravg(p, rq, TASK_WAKE, wallclock, 0); @@ -2230,6 +2258,11 @@ static void try_to_wake_up_local(struct task_struct *p)  		update_task_ravg(rq->curr, rq, TASK_UPDATE, wallclock, 0);  		update_task_ravg(p, rq, TASK_WAKE, wallclock, 0);  		cpufreq_update_util(rq, 0); + +		wallclock = walt_ktime_clock(); + +		walt_update_task_ravg(rq->curr, rq, TASK_UPDATE, wallclock, 0); +		walt_update_task_ravg(p, rq, TASK_WAKE, wallclock, 0);  		ttwu_activate(rq, p, ENQUEUE_WAKEUP);  		note_task_waking(p, wallclock);  	} @@ -2362,6 +2395,7 @@ static void __sched_fork(unsigned long clone_flags, struct task_struct *p)  #endif  	INIT_LIST_HEAD(&p->se.group_node); +	walt_init_new_task_load(p);  #ifdef CONFIG_FAIR_GROUP_SCHED  	p->se.cfs_rq			= NULL; @@ -2646,6 +2680,7 @@ void wake_up_new_task(struct task_struct *p)  	struct rq *rq;  	add_new_task_to_grp(p); +	walt_init_new_task_load(p);  	raw_spin_lock_irqsave(&p->pi_lock, flags);  	p->state = TASK_RUNNING; @@ -2664,6 +2699,7 @@ void wake_up_new_task(struct task_struct *p)  #endif  	rq = __task_rq_lock(p);  	mark_task_starting(p); +	walt_mark_task_starting(p);  	update_rq_clock(rq);  	post_init_entity_util_avg(&p->se);  	activate_task(rq, p, ENQUEUE_WAKEUP_NEW); @@ -3134,6 +3170,23 @@ EXPORT_PER_CPU_SYMBOL(kstat);  EXPORT_PER_CPU_SYMBOL(kernel_cpustat);  /* + * The function fair_sched_class.update_curr accesses the struct curr + * and its field curr->exec_start; when called from task_sched_runtime(), + * we observe a high rate of cache misses in practice. + * Prefetching this data results in improved performance. + */ +static inline void prefetch_curr_exec_start(struct task_struct *p) +{ +#ifdef CONFIG_FAIR_GROUP_SCHED +	struct sched_entity *curr = (&p->se)->cfs_rq->curr; +#else +	struct sched_entity *curr = (&task_rq(p)->cfs)->curr; +#endif +	prefetch(curr); +	prefetch(&curr->exec_start); +} + +/*   * Return accounted runtime for the task.   * In case the task is currently running, return the runtime plus current's   * pending runtime that have not been accounted yet. @@ -3167,6 +3220,7 @@ unsigned long long task_sched_runtime(struct task_struct *p)  	 * thread, breaking clock_gettime().  	 */  	if (task_current(rq, p) && task_on_rq_queued(p)) { +		prefetch_curr_exec_start(p);  		update_rq_clock(rq);  		p->sched_class->update_curr(rq);  	} @@ -3194,10 +3248,13 @@ void scheduler_tick(void)  	raw_spin_lock(&rq->lock);  	old_load = task_load(curr); +	walt_set_window_start(rq);  	set_window_start(rq);  	update_rq_clock(rq);  	curr->sched_class->task_tick(rq, curr, 0);  	update_cpu_load_active(rq); +	walt_update_task_ravg(rq->curr, rq, TASK_UPDATE, +			walt_ktime_clock(), 0);  	calc_global_load_tick(rq);  	wallclock = sched_ktime_clock();  	update_task_ravg(rq->curr, rq, TASK_UPDATE, wallclock, 0); @@ -3561,6 +3618,9 @@ static void __sched notrace __schedule(bool preempt)  		update_rq_clock(rq);  	next = pick_next_task(rq, prev); +	wallclock = walt_ktime_clock(); +	walt_update_task_ravg(prev, rq, PUT_PREV_TASK, wallclock, 0); +	walt_update_task_ravg(next, rq, PICK_NEXT_TASK, wallclock, 0);  	clear_tsk_need_resched(prev);  	clear_preempt_need_resched();  	rq->clock_skip_update = 0; @@ -4902,6 +4962,9 @@ again:  		retval = -EINVAL;  	} +	if (!retval && !(p->flags & PF_KTHREAD)) +		cpumask_and(&p->cpus_requested, in_mask, cpu_possible_mask); +  out_free_new_mask:  	free_cpumask_var(new_mask);  out_free_cpus_allowed: @@ -5923,12 +5986,6 @@ int sched_isolate_cpu(int cpu)  	cpumask_andnot(&avail_cpus, cpu_online_mask, cpu_isolated_mask); -	/* We cannot isolate ALL cpus in the system */ -	if (cpumask_weight(&avail_cpus) == 1) { -		ret_code = -EINVAL; -		goto out; -	} -  	if (!cpu_online(cpu)) {  		ret_code = -EINVAL;  		goto out; @@ -5937,6 +5994,13 @@ int sched_isolate_cpu(int cpu)  	if (++cpu_isolation_vote[cpu] > 1)  		goto out; +	/* We cannot isolate ALL cpus in the system */ +	if (cpumask_weight(&avail_cpus) == 1) { +		--cpu_isolation_vote[cpu]; +		ret_code = -EINVAL; +		goto out; +	} +  	/*  	 * There is a race between watchdog being enabled by hotplug and  	 * core isolation disabling the watchdog. When a CPU is hotplugged in @@ -5960,7 +6024,9 @@ int sched_isolate_cpu(int cpu)  	smp_call_function_any(&avail_cpus, hrtimer_quiesce_cpu, &cpu, 1);  	smp_call_function_any(&avail_cpus, timer_quiesce_cpu, &cpu, 1); +	irq_lock_sparse();  	stop_cpus(cpumask_of(cpu), do_isolation_work_cpu_stop, 0); +	irq_unlock_sparse();  	calc_load_migrate(rq);  	update_max_interval(); @@ -6319,6 +6385,7 @@ migration_call(struct notifier_block *nfb, unsigned long action, void *hcpu)  	case CPU_UP_PREPARE:  		raw_spin_lock_irqsave(&rq->lock, flags); +		walt_set_window_start(rq);  		set_window_start(rq);  		raw_spin_unlock_irqrestore(&rq->lock, flags);  		rq->calc_load_update = calc_load_update; @@ -6340,6 +6407,7 @@ migration_call(struct notifier_block *nfb, unsigned long action, void *hcpu)  		sched_ttwu_pending();  		/* Update our root-domain */  		raw_spin_lock_irqsave(&rq->lock, flags); +		walt_migrate_sync_cpu(cpu);  		if (rq->rd) {  			BUG_ON(!cpumask_test_cpu(cpu, rq->rd->span)); @@ -8325,6 +8393,7 @@ void __init sched_init_smp(void)  	/* Move init over to a non-isolated CPU */  	if (set_cpus_allowed_ptr(current, non_isolated_cpus) < 0)  		BUG(); +	cpumask_copy(¤t->cpus_requested, cpu_possible_mask);  	sched_init_granularity();  	free_cpumask_var(non_isolated_cpus); @@ -8534,6 +8603,11 @@ void __init sched_init(void)  		}  #endif  		rq->max_idle_balance_cost = sysctl_sched_migration_cost; +#ifdef CONFIG_SCHED_WALT +		rq->cur_irqload = 0; +		rq->avg_irqload = 0; +		rq->irqload_ts = 0; +#endif  		INIT_LIST_HEAD(&rq->cfs_tasks); | 
