// SPDX-License-Identifier: GPL-2.0
/*
 * Data Access Monitor
 *
 * Author: SeongJae Park <sjpark@amazon.de>
 */

#define pr_fmt(fmt) "damon: " fmt

#include <linux/damon.h>
#include <linux/delay.h>
#include <linux/kthread.h>
#include <linux/mm.h>
#include <linux/slab.h>
#include <linux/string.h>

#define CREATE_TRACE_POINTS
#include <trace/events/damon.h>

#ifdef CONFIG_DAMON_KUNIT_TEST
#undef DAMON_MIN_REGION
#define DAMON_MIN_REGION 1
#endif

static DEFINE_MUTEX(damon_lock);
static int nr_running_ctxs;

/*
 * Construct a damon_region struct
 *
 * Returns the pointer to the new struct on success, or NULL otherwise
 */
struct damon_region *damon_new_region(unsigned long start, unsigned long end)
{
	struct damon_region *region;

	region = kmalloc(sizeof(*region), GFP_KERNEL);
	if (!region)
		return NULL;

	region->ar.start = start;
	region->ar.end = end;
	region->nr_accesses = 0;
	INIT_LIST_HEAD(&region->list);

	region->age = 0;
	region->last_nr_accesses = 0;

	return region;
}

void damon_add_region(struct damon_region *r, struct damon_target *t)
{
	list_add_tail(&r->list, &t->regions_list);
	t->nr_regions++;
}

static void damon_del_region(struct damon_region *r, struct damon_target *t)
{
	list_del(&r->list);
	t->nr_regions--;
}

static void damon_free_region(struct damon_region *r)
{
	kfree(r);
}

void damon_destroy_region(struct damon_region *r, struct damon_target *t)
{
	damon_del_region(r, t);
	damon_free_region(r);
}
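
/*
 * A usage sketch of the region helpers above, for illustration only;
 * the target id and the address range are hypothetical and error
 * handling is trimmed:
 *
 *	struct damon_target *t = damon_new_target(42);
 *	struct damon_region *r = damon_new_region(0x1000, 0x2000);
 *
 *	if (t && r)
 *		damon_add_region(r, t);
 *	...
 *	damon_destroy_region(r, t);
 *
 * damon_destroy_region() both unlinks the region from its target and
 * frees it, so no separate kfree() is needed.
 */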

struct damos *damon_new_scheme(
		unsigned long min_sz_region, unsigned long max_sz_region,
		unsigned int min_nr_accesses, unsigned int max_nr_accesses,
		unsigned int min_age_region, unsigned int max_age_region,
		enum damos_action action, struct damos_quota *quota,
		struct damos_watermarks *wmarks)
{
	struct damos *scheme;

	scheme = kmalloc(sizeof(*scheme), GFP_KERNEL);
	if (!scheme)
		return NULL;
	scheme->min_sz_region = min_sz_region;
	scheme->max_sz_region = max_sz_region;
	scheme->min_nr_accesses = min_nr_accesses;
	scheme->max_nr_accesses = max_nr_accesses;
	scheme->min_age_region = min_age_region;
	scheme->max_age_region = max_age_region;
	scheme->action = action;
	scheme->stat = (struct damos_stat){};
	INIT_LIST_HEAD(&scheme->list);

	scheme->quota.ms = quota->ms;
	scheme->quota.sz = quota->sz;
	scheme->quota.reset_interval = quota->reset_interval;
	scheme->quota.weight_sz = quota->weight_sz;
	scheme->quota.weight_nr_accesses = quota->weight_nr_accesses;
	scheme->quota.weight_age = quota->weight_age;
	scheme->quota.total_charged_sz = 0;
	scheme->quota.total_charged_ns = 0;
	scheme->quota.esz = 0;
	scheme->quota.charged_sz = 0;
	scheme->quota.charged_from = 0;
	scheme->quota.charge_target_from = NULL;
	scheme->quota.charge_addr_from = 0;

	scheme->wmarks.metric = wmarks->metric;
	scheme->wmarks.interval = wmarks->interval;
	scheme->wmarks.high = wmarks->high;
	scheme->wmarks.mid = wmarks->mid;
	scheme->wmarks.low = wmarks->low;
	scheme->wmarks.activated = true;

	return scheme;
}
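
/*
 * A minimal construction sketch, for illustration only; the access
 * pattern values below are hypothetical.  DAMOS_WMARK_NONE keeps the
 * scheme always activated, and an all-zero quota means "no limit"
 * (kdamond_apply_schemes() skips quota handling when both ->ms and
 * ->sz are zero):
 *
 *	struct damos_quota quota = {};
 *	struct damos_watermarks wmarks = { .metric = DAMOS_WMARK_NONE };
 *	struct damos *s = damon_new_scheme(PAGE_SIZE, ULONG_MAX,
 *			0, 0, 10, UINT_MAX, DAMOS_PAGEOUT, &quota, &wmarks);
 */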

void damon_add_scheme(struct damon_ctx *ctx, struct damos *s)
{
	list_add_tail(&s->list, &ctx->schemes);
}

static void damon_del_scheme(struct damos *s)
{
	list_del(&s->list);
}

static void damon_free_scheme(struct damos *s)
{
	kfree(s);
}

void damon_destroy_scheme(struct damos *s)
{
	damon_del_scheme(s);
	damon_free_scheme(s);
}

/*
 * Construct a damon_target struct
 *
 * Returns the pointer to the new struct on success, or NULL otherwise
 */
struct damon_target *damon_new_target(unsigned long id)
{
	struct damon_target *t;

	t = kmalloc(sizeof(*t), GFP_KERNEL);
	if (!t)
		return NULL;

	t->id = id;
	t->nr_regions = 0;
	INIT_LIST_HEAD(&t->regions_list);
	INIT_LIST_HEAD(&t->list);

	return t;
}

void damon_add_target(struct damon_ctx *ctx, struct damon_target *t)
{
	list_add_tail(&t->list, &ctx->adaptive_targets);
}

bool damon_targets_empty(struct damon_ctx *ctx)
{
	return list_empty(&ctx->adaptive_targets);
}

static void damon_del_target(struct damon_target *t)
{
	list_del(&t->list);
}

void damon_free_target(struct damon_target *t)
{
	struct damon_region *r, *next;

	damon_for_each_region_safe(r, next, t)
		damon_free_region(r);
	kfree(t);
}

void damon_destroy_target(struct damon_target *t)
{
	damon_del_target(t);
	damon_free_target(t);
}

unsigned int damon_nr_regions(struct damon_target *t)
{
	return t->nr_regions;
}

struct damon_ctx *damon_new_ctx(void)
{
	struct damon_ctx *ctx;

	ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
	if (!ctx)
		return NULL;

	ctx->sample_interval = 5 * 1000;
	ctx->aggr_interval = 100 * 1000;
	ctx->primitive_update_interval = 60 * 1000 * 1000;

	ktime_get_coarse_ts64(&ctx->last_aggregation);
	ctx->last_primitive_update = ctx->last_aggregation;

	mutex_init(&ctx->kdamond_lock);

	ctx->min_nr_regions = 10;
	ctx->max_nr_regions = 1000;

	INIT_LIST_HEAD(&ctx->adaptive_targets);
	INIT_LIST_HEAD(&ctx->schemes);

	return ctx;
}
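
/*
 * Note on the defaults above: the intervals are in microseconds, so a
 * fresh context samples every 5 ms, aggregates every 100 ms, and
 * re-checks the monitoring primitive every 60 s:
 *
 *	5 * 1000 us		=   5 ms	(sample_interval)
 *	100 * 1000 us		= 100 ms	(aggr_interval)
 *	60 * 1000 * 1000 us	=  60 s		(primitive_update_interval)
 */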

static void damon_destroy_targets(struct damon_ctx *ctx)
{
	struct damon_target *t, *next_t;

	if (ctx->primitive.cleanup) {
		ctx->primitive.cleanup(ctx);
		return;
	}

	damon_for_each_target_safe(t, next_t, ctx)
		damon_destroy_target(t);
}

void damon_destroy_ctx(struct damon_ctx *ctx)
{
	struct damos *s, *next_s;

	damon_destroy_targets(ctx);

	damon_for_each_scheme_safe(s, next_s, ctx)
		damon_destroy_scheme(s);

	kfree(ctx);
}

/**
 * damon_set_targets() - Set monitoring targets.
 * @ctx:	monitoring context
 * @ids:	array of target ids
 * @nr_ids:	number of entries in @ids
 *
 * This function should not be called while the kdamond is running.
 *
 * Return: 0 on success, negative error code otherwise.
 */
int damon_set_targets(struct damon_ctx *ctx,
		      unsigned long *ids, ssize_t nr_ids)
{
	ssize_t i;
	struct damon_target *t, *next;

	damon_destroy_targets(ctx);

	for (i = 0; i < nr_ids; i++) {
		t = damon_new_target(ids[i]);
		if (!t) {
			/* The caller should do cleanup of the ids itself */
			damon_for_each_target_safe(t, next, ctx)
				damon_destroy_target(t);
			return -ENOMEM;
		}
		damon_add_target(ctx, t);
	}

	return 0;
}
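
/*
 * Usage sketch, for illustration only; the id value is hypothetical,
 * and the interpretation of each id is up to the monitoring primitive
 * in use:
 *
 *	unsigned long ids[] = { 1234 };
 *
 *	if (damon_set_targets(ctx, ids, ARRAY_SIZE(ids)))
 *		pr_err("failed setting targets\n");
 */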

/**
 * damon_set_attrs() - Set attributes for the monitoring.
 * @ctx:		monitoring context
 * @sample_int:		time interval between samplings
 * @aggr_int:		time interval between aggregations
 * @primitive_upd_int:	time interval between monitoring primitive updates
 * @min_nr_reg:		minimum number of regions
 * @max_nr_reg:		maximum number of regions
 *
 * This function should not be called while the kdamond is running.
 * Every time interval is in microseconds.
 *
 * Return: 0 on success, negative error code otherwise.
 */
int damon_set_attrs(struct damon_ctx *ctx, unsigned long sample_int,
		    unsigned long aggr_int, unsigned long primitive_upd_int,
		    unsigned long min_nr_reg, unsigned long max_nr_reg)
{
	if (min_nr_reg < 3)
		return -EINVAL;
	if (min_nr_reg > max_nr_reg)
		return -EINVAL;

	ctx->sample_interval = sample_int;
	ctx->aggr_interval = aggr_int;
	ctx->primitive_update_interval = primitive_upd_int;
	ctx->min_nr_regions = min_nr_reg;
	ctx->max_nr_regions = max_nr_reg;

	return 0;
}
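
/*
 * Usage sketch, for illustration only: this reproduces the
 * damon_new_ctx() defaults explicitly.  All intervals are in
 * microseconds, and min_nr_reg below 3 is rejected with -EINVAL:
 *
 *	err = damon_set_attrs(ctx, 5000, 100000, 60000000, 10, 1000);
 *	if (err)
 *		return err;
 */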

/**
 * damon_set_schemes() - Set data access monitoring based operation schemes.
 * @ctx:	monitoring context
 * @schemes:	array of the schemes
 * @nr_schemes:	number of entries in @schemes
 *
 * This function should not be called while the kdamond of the context is
 * running.
 *
 * Return: 0 on success, or negative error code otherwise.
 */
int damon_set_schemes(struct damon_ctx *ctx, struct damos **schemes,
			ssize_t nr_schemes)
{
	struct damos *s, *next;
	ssize_t i;

	damon_for_each_scheme_safe(s, next, ctx)
		damon_destroy_scheme(s);
	for (i = 0; i < nr_schemes; i++)
		damon_add_scheme(ctx, schemes[i]);
	return 0;
}

/**
 * damon_nr_running_ctxs() - Return number of currently running contexts.
 */
int damon_nr_running_ctxs(void)
{
	int nr_ctxs;

	mutex_lock(&damon_lock);
	nr_ctxs = nr_running_ctxs;
	mutex_unlock(&damon_lock);

	return nr_ctxs;
}

/* Returns the size upper limit for each monitoring region */
static unsigned long damon_region_sz_limit(struct damon_ctx *ctx)
{
	struct damon_target *t;
	struct damon_region *r;
	unsigned long sz = 0;

	damon_for_each_target(t, ctx) {
		damon_for_each_region(r, t)
			sz += r->ar.end - r->ar.start;
	}

	if (ctx->min_nr_regions)
		sz /= ctx->min_nr_regions;
	if (sz < DAMON_MIN_REGION)
		sz = DAMON_MIN_REGION;

	return sz;
}

static int kdamond_fn(void *data);

/*
 * __damon_start() - Starts monitoring with given context.
 * @ctx:	monitoring context
 *
 * This function should be called while damon_lock is held.
 *
 * Return: 0 on success, negative error code otherwise.
 */
static int __damon_start(struct damon_ctx *ctx)
{
	int err = -EBUSY;

	mutex_lock(&ctx->kdamond_lock);
	if (!ctx->kdamond) {
		err = 0;
		ctx->kdamond = kthread_run(kdamond_fn, ctx, "kdamond.%d",
				nr_running_ctxs);
		if (IS_ERR(ctx->kdamond)) {
			err = PTR_ERR(ctx->kdamond);
			ctx->kdamond = NULL;
		}
	}
	mutex_unlock(&ctx->kdamond_lock);

	return err;
}

/**
 * damon_start() - Starts the monitorings for a given group of contexts.
 * @ctxs:	an array of the pointers for contexts to start monitoring
 * @nr_ctxs:	size of @ctxs
 *
 * This function starts a group of monitoring threads for a group of monitoring
 * contexts.  One thread per context is created and run in parallel.  The
 * caller should handle synchronization between the threads by itself.  If a
 * group of threads that was created by another 'damon_start()' call is
 * currently running, this function does nothing but returns -EBUSY.
 *
 * Return: 0 on success, negative error code otherwise.
 */
int damon_start(struct damon_ctx **ctxs, int nr_ctxs)
{
	int i;
	int err = 0;

	mutex_lock(&damon_lock);
	if (nr_running_ctxs) {
		mutex_unlock(&damon_lock);
		return -EBUSY;
	}

	for (i = 0; i < nr_ctxs; i++) {
		err = __damon_start(ctxs[i]);
		if (err)
			break;
		nr_running_ctxs++;
	}
	mutex_unlock(&damon_lock);

	return err;
}
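
/*
 * A start-to-stop sketch, for illustration only; configuring targets,
 * attributes, and a monitoring primitive (e.g. via
 * damon_va_set_primitives(), if available in this tree) is assumed to
 * have happened in the elided part:
 *
 *	struct damon_ctx *ctx = damon_new_ctx();
 *	...
 *	if (damon_start(&ctx, 1))
 *		goto out;
 *	...
 *	damon_stop(&ctx, 1);
 *	damon_destroy_ctx(ctx);
 */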

/*
 * __damon_stop() - Stops monitoring of given context.
 * @ctx:	monitoring context
 *
 * Return: 0 on success, negative error code otherwise.
 */
static int __damon_stop(struct damon_ctx *ctx)
{
	struct task_struct *tsk;

	mutex_lock(&ctx->kdamond_lock);
	tsk = ctx->kdamond;
	if (tsk) {
		get_task_struct(tsk);
		mutex_unlock(&ctx->kdamond_lock);
		kthread_stop(tsk);
		put_task_struct(tsk);
		return 0;
	}
	mutex_unlock(&ctx->kdamond_lock);

	return -EPERM;
}

/**
 * damon_stop() - Stops the monitorings for a given group of contexts.
 * @ctxs:	an array of the pointers for contexts to stop monitoring
 * @nr_ctxs:	size of @ctxs
 *
 * Return: 0 on success, negative error code otherwise.
 */
int damon_stop(struct damon_ctx **ctxs, int nr_ctxs)
{
	int i, err = 0;

	for (i = 0; i < nr_ctxs; i++) {
		/* nr_running_ctxs is decremented in kdamond_fn */
		err = __damon_stop(ctxs[i]);
		if (err)
			return err;
	}

	return err;
}

/*
 * damon_check_reset_time_interval() - Check if a time interval has elapsed.
 * @baseline:	the time to check whether the interval has elapsed since
 * @interval:	the time interval (microseconds)
 *
 * See whether the given time interval has passed since the given baseline
 * time.  If so, it also updates the baseline to current time for next check.
 *
 * Return:	true if the time interval has passed, or false otherwise.
 */
static bool damon_check_reset_time_interval(struct timespec64 *baseline,
		unsigned long interval)
{
	struct timespec64 now;

	ktime_get_coarse_ts64(&now);
	if ((timespec64_to_ns(&now) - timespec64_to_ns(baseline)) <
			interval * 1000)
		return false;
	*baseline = now;
	return true;
}
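
/*
 * Worked example (values hypothetical): @interval is in microseconds
 * but the comparison is done in nanoseconds, so @interval = 100000
 * (100 ms) is checked against 100000 * 1000 = 100,000,000 ns.  If
 * now - baseline is only 40,000,000 ns (40 ms), this returns false and
 * leaves the baseline alone; once the difference reaches 100 ms, it
 * returns true and resets the baseline to now.
 */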

/*
 * Check whether it is time to flush the aggregated information
 */
static bool kdamond_aggregate_interval_passed(struct damon_ctx *ctx)
{
	return damon_check_reset_time_interval(&ctx->last_aggregation,
			ctx->aggr_interval);
}

/*
 * Reset the aggregated monitoring results ('nr_accesses' of each region).
 */
static void kdamond_reset_aggregated(struct damon_ctx *c)
{
	struct damon_target *t;
	unsigned int ti = 0;	/* target's index */

	damon_for_each_target(t, c) {
		struct damon_region *r;

		damon_for_each_region(r, t) {
			trace_damon_aggregated(t, ti, r, damon_nr_regions(t));
			r->last_nr_accesses = r->nr_accesses;
			r->nr_accesses = 0;
		}
		ti++;
	}
}

static void damon_split_region_at(struct damon_ctx *ctx,
		struct damon_target *t, struct damon_region *r,
		unsigned long sz_r);

static bool __damos_valid_target(struct damon_region *r, struct damos *s)
{
	unsigned long sz;

	sz = r->ar.end - r->ar.start;
	return s->min_sz_region <= sz && sz <= s->max_sz_region &&
		s->min_nr_accesses <= r->nr_accesses &&
		r->nr_accesses <= s->max_nr_accesses &&
		s->min_age_region <= r->age && r->age <= s->max_age_region;
}

static bool damos_valid_target(struct damon_ctx *c, struct damon_target *t,
		struct damon_region *r, struct damos *s)
{
	bool ret = __damos_valid_target(r, s);

	if (!ret || !s->quota.esz || !c->primitive.get_scheme_score)
		return ret;

	return c->primitive.get_scheme_score(c, t, r, s) >= s->quota.min_score;
}

static void damon_do_apply_schemes(struct damon_ctx *c,
				   struct damon_target *t,
				   struct damon_region *r)
{
	struct damos *s;

	damon_for_each_scheme(s, c) {
		struct damos_quota *quota = &s->quota;
		unsigned long sz = r->ar.end - r->ar.start;
		struct timespec64 begin, end;
		unsigned long sz_applied = 0;

		if (!s->wmarks.activated)
			continue;

		/* Check the quota */
		if (quota->esz && quota->charged_sz >= quota->esz)
			continue;

		/* Skip previously charged regions */
		if (quota->charge_target_from) {
			if (t != quota->charge_target_from)
				continue;
			if (r == damon_last_region(t)) {
				quota->charge_target_from = NULL;
				quota->charge_addr_from = 0;
				continue;
			}
			if (quota->charge_addr_from &&
					r->ar.end <= quota->charge_addr_from)
				continue;

			if (quota->charge_addr_from && r->ar.start <
					quota->charge_addr_from) {
				sz = ALIGN_DOWN(quota->charge_addr_from -
						r->ar.start, DAMON_MIN_REGION);
				if (!sz) {
					if (r->ar.end - r->ar.start <=
							DAMON_MIN_REGION)
						continue;
					sz = DAMON_MIN_REGION;
				}
				damon_split_region_at(c, t, r, sz);
				r = damon_next_region(r);
				sz = r->ar.end - r->ar.start;
			}
			quota->charge_target_from = NULL;
			quota->charge_addr_from = 0;
		}

		if (!damos_valid_target(c, t, r, s))
			continue;

		/* Apply the scheme */
		if (c->primitive.apply_scheme) {
			if (quota->esz &&
					quota->charged_sz + sz > quota->esz) {
				sz = ALIGN_DOWN(quota->esz - quota->charged_sz,
						DAMON_MIN_REGION);
				if (!sz)
					goto update_stat;
				damon_split_region_at(c, t, r, sz);
			}
			ktime_get_coarse_ts64(&begin);
			sz_applied = c->primitive.apply_scheme(c, t, r, s);
			ktime_get_coarse_ts64(&end);
			quota->total_charged_ns += timespec64_to_ns(&end) -
				timespec64_to_ns(&begin);
			quota->charged_sz += sz;
			if (quota->esz && quota->charged_sz >= quota->esz) {
				quota->charge_target_from = t;
				quota->charge_addr_from = r->ar.end + 1;
			}
		}
		if (s->action != DAMOS_STAT)
			r->age = 0;

update_stat:
		s->stat.nr_tried++;
		s->stat.sz_tried += sz;
		if (sz_applied)
			s->stat.nr_applied++;
		s->stat.sz_applied += sz_applied;
	}
}

/* Shouldn't be called if quota->ms and quota->sz are zero */
static void damos_set_effective_quota(struct damos_quota *quota)
{
	unsigned long throughput;
	unsigned long esz;

	if (!quota->ms) {
		quota->esz = quota->sz;
		return;
	}

	if (quota->total_charged_ns)
		throughput = quota->total_charged_sz * 1000000 /
			quota->total_charged_ns;
	else
		throughput = PAGE_SIZE * 1024;
	esz = throughput * quota->ms;

	if (quota->sz && quota->sz < esz)
		esz = quota->sz;
	quota->esz = esz;
}
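
/*
 * Worked example (values hypothetical): throughput is in bytes per
 * millisecond.  If 4 MiB were charged over 1 second of apply_scheme()
 * time, throughput = 4194304 * 1000000 / 1000000000 = 4194 bytes/ms.
 * With quota->ms = 10, esz = 41940 bytes (~41 KiB); a nonzero and
 * smaller quota->sz caps esz further.  Before the first charge, the
 * throughput is assumed to be PAGE_SIZE * 1024 per millisecond
 * (4 MiB/ms with 4 KiB pages).
 */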

static void kdamond_apply_schemes(struct damon_ctx *c)
{
	struct damon_target *t;
	struct damon_region *r, *next_r;
	struct damos *s;

	damon_for_each_scheme(s, c) {
		struct damos_quota *quota = &s->quota;
		unsigned long cumulated_sz;
		unsigned int score, max_score = 0;

		if (!s->wmarks.activated)
			continue;

		if (!quota->ms && !quota->sz)
			continue;

		/* New charge window starts */
		if (time_after_eq(jiffies, quota->charged_from +
					msecs_to_jiffies(
						quota->reset_interval))) {
			if (quota->esz && quota->charged_sz >= quota->esz)
				s->stat.qt_exceeds++;
			quota->total_charged_sz += quota->charged_sz;
			quota->charged_from = jiffies;
			quota->charged_sz = 0;
			damos_set_effective_quota(quota);
		}

		if (!c->primitive.get_scheme_score)
			continue;

		/* Fill up the score histogram */
		memset(quota->histogram, 0, sizeof(quota->histogram));
		damon_for_each_target(t, c) {
			damon_for_each_region(r, t) {
				if (!__damos_valid_target(r, s))
					continue;
				score = c->primitive.get_scheme_score(
						c, t, r, s);
				quota->histogram[score] +=
					r->ar.end - r->ar.start;
				if (score > max_score)
					max_score = score;
			}
		}

		/* Set the min score limit */
		for (cumulated_sz = 0, score = max_score; ; score--) {
			cumulated_sz += quota->histogram[score];
			if (cumulated_sz >= quota->esz || !score)
				break;
		}
		quota->min_score = score;
	}

	damon_for_each_target(t, c) {
		damon_for_each_region_safe(r, next_r, t)
			damon_do_apply_schemes(c, t, r);
	}
}

static inline unsigned long sz_damon_region(struct damon_region *r)
{
	return r->ar.end - r->ar.start;
}

/*
 * Merge two adjacent regions into one region
 */
static void damon_merge_two_regions(struct damon_target *t,
		struct damon_region *l, struct damon_region *r)
{
	unsigned long sz_l = sz_damon_region(l), sz_r = sz_damon_region(r);

	l->nr_accesses = (l->nr_accesses * sz_l + r->nr_accesses * sz_r) /
			(sz_l + sz_r);
	l->age = (l->age * sz_l + r->age * sz_r) / (sz_l + sz_r);
	l->ar.end = r->ar.end;
	damon_destroy_region(r, t);
}
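
/*
 * Worked example (values hypothetical): the merged counters are
 * size-weighted averages.  For l of 8 KiB with nr_accesses 10 and r of
 * 4 KiB with nr_accesses 4, the merged region covers both ranges and
 * gets nr_accesses = (10 * 8192 + 4 * 4096) / 12288 = 8.
 */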

/*
 * Merge adjacent regions having similar access frequencies
 *
 * t		target affected by this merge operation
 * thres	'->nr_accesses' diff threshold for the merge
 * sz_limit	size upper limit of each region
 */
static void damon_merge_regions_of(struct damon_target *t, unsigned int thres,
				   unsigned long sz_limit)
{
	struct damon_region *r, *prev = NULL, *next;

	damon_for_each_region_safe(r, next, t) {
		if (abs(r->nr_accesses - r->last_nr_accesses) > thres)
			r->age = 0;
		else
			r->age++;

		if (prev && prev->ar.end == r->ar.start &&
		    abs(prev->nr_accesses - r->nr_accesses) <= thres &&
		    sz_damon_region(prev) + sz_damon_region(r) <= sz_limit)
			damon_merge_two_regions(t, prev, r);
		else
			prev = r;
	}
}

/*
 * Merge adjacent regions having similar access frequencies
 *
 * threshold	'->nr_accesses' diff threshold for the merge
 * sz_limit	size upper limit of each region
 *
 * This function merges monitoring target regions which are adjacent and whose
 * access frequencies are similar.  This is for minimizing the monitoring
 * overhead under the dynamically changeable access pattern.  If a merge was
 * unnecessarily made, later 'kdamond_split_regions()' will revert it.
 */
static void kdamond_merge_regions(struct damon_ctx *c, unsigned int threshold,
				  unsigned long sz_limit)
{
	struct damon_target *t;

	damon_for_each_target(t, c)
		damon_merge_regions_of(t, threshold, sz_limit);
}

/*
 * Split a region in two
 *
 * r		the region to be split
 * sz_r		size of the first sub-region that will be made
 */
static void damon_split_region_at(struct damon_ctx *ctx,
		struct damon_target *t, struct damon_region *r,
		unsigned long sz_r)
{
	struct damon_region *new;

	new = damon_new_region(r->ar.start + sz_r, r->ar.end);
	if (!new)
		return;

	r->ar.end = new->ar.start;

	new->age = r->age;
	new->last_nr_accesses = r->last_nr_accesses;

	damon_insert_region(new, r, damon_next_region(r), t);
}

/* Split every region in the given target into 'nr_subs' regions */
static void damon_split_regions_of(struct damon_ctx *ctx,
				     struct damon_target *t, int nr_subs)
{
	struct damon_region *r, *next;
	unsigned long sz_region, sz_sub = 0;
	int i;

	damon_for_each_region_safe(r, next, t) {
		sz_region = r->ar.end - r->ar.start;

		for (i = 0; i < nr_subs - 1 &&
				sz_region > 2 * DAMON_MIN_REGION; i++) {
			/*
			 * Randomly select size of left sub-region to be at
			 * least 10 percent and at most 90 percent of the
			 * original region
			 */
			sz_sub = ALIGN_DOWN(damon_rand(1, 10) *
					sz_region / 10, DAMON_MIN_REGION);
			/* Do not allow blank region */
			if (sz_sub == 0 || sz_sub >= sz_region)
				continue;

			damon_split_region_at(ctx, t, r, sz_sub);
			sz_region = sz_sub;
		}
	}
}

/*
 * Split every target region into randomly-sized small regions
 *
 * This function splits every target region into random-sized small regions if
 * the current total number of the regions is equal to or smaller than half of
 * the user-specified maximum number of regions.  This is for maximizing the
 * monitoring accuracy under the dynamically changeable access patterns.  If a
 * split was unnecessarily made, later 'kdamond_merge_regions()' will revert
 * it.
 */
static void kdamond_split_regions(struct damon_ctx *ctx)
{
	struct damon_target *t;
	unsigned int nr_regions = 0;
	static unsigned int last_nr_regions;
	int nr_subregions = 2;

	damon_for_each_target(t, ctx)
		nr_regions += damon_nr_regions(t);

	if (nr_regions > ctx->max_nr_regions / 2)
		return;

	/* Maybe the middle of the region has different access frequency */
	if (last_nr_regions == nr_regions &&
			nr_regions < ctx->max_nr_regions / 3)
		nr_subregions = 3;

	damon_for_each_target(t, ctx)
		damon_split_regions_of(ctx, t, nr_subregions);

	last_nr_regions = nr_regions;
}

/*
 * Check whether it is time to check and apply the target monitoring regions
 *
 * Returns true if it is.
 */
static bool kdamond_need_update_primitive(struct damon_ctx *ctx)
{
	return damon_check_reset_time_interval(&ctx->last_primitive_update,
			ctx->primitive_update_interval);
}

/*
 * Check whether current monitoring should be stopped
 *
 * The monitoring is stopped when either the user requested to stop, or all
 * monitoring targets are invalid.
 *
 * Returns true if the current monitoring should be stopped.
 */
static bool kdamond_need_stop(struct damon_ctx *ctx)
{
	struct damon_target *t;

	if (kthread_should_stop())
		return true;

	if (!ctx->primitive.target_valid)
		return false;

	damon_for_each_target(t, ctx) {
		if (ctx->primitive.target_valid(t))
			return false;
	}

	return true;
}

static unsigned long damos_wmark_metric_value(enum damos_wmark_metric metric)
{
	struct sysinfo i;

	switch (metric) {
	case DAMOS_WMARK_FREE_MEM_RATE:
		si_meminfo(&i);
		return i.freeram * 1000 / i.totalram;
	default:
		break;
	}
	return -EINVAL;
}
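
/*
 * Worked example (values hypothetical): the free memory rate is in
 * per-thousand.  With 2 GiB free out of 8 GiB total (si_meminfo()
 * reports both in pages, so the units cancel), the metric is
 * 2 * 1000 / 8 = 250, i.e. 25% of memory is free.
 */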

/*
 * Returns zero if the scheme is active.  Else, returns time to wait for next
 * watermark check in microseconds.
 */
static unsigned long damos_wmark_wait_us(struct damos *scheme)
{
	unsigned long metric;

	if (scheme->wmarks.metric == DAMOS_WMARK_NONE)
		return 0;

	metric = damos_wmark_metric_value(scheme->wmarks.metric);
	/* higher than high watermark or lower than low watermark */
	if (metric > scheme->wmarks.high || scheme->wmarks.low > metric) {
		if (scheme->wmarks.activated)
			pr_debug("deactivate a scheme (%d) for %s wmark\n",
					scheme->action,
					metric > scheme->wmarks.high ?
					"high" : "low");
		scheme->wmarks.activated = false;
		return scheme->wmarks.interval;
	}

	/* inactive and higher than middle watermark */
	if ((scheme->wmarks.high >= metric && metric >= scheme->wmarks.mid) &&
			!scheme->wmarks.activated)
		return scheme->wmarks.interval;

	if (!scheme->wmarks.activated)
		pr_debug("activate a scheme (%d)\n", scheme->action);
	scheme->wmarks.activated = true;
	return 0;
}

static void kdamond_usleep(unsigned long usecs)
{
	/* See Documentation/timers/timers-howto.rst for the thresholds */
	if (usecs > 20 * USEC_PER_MSEC)
		schedule_timeout_idle(usecs_to_jiffies(usecs));
	else
		usleep_idle_range(usecs, usecs + 1);
}

/*
 * Returns zero once at least one scheme got activated, or a negative error
 * code if the monitoring should stop while waiting for an activation.
 */
static int kdamond_wait_activation(struct damon_ctx *ctx)
{
	struct damos *s;
	unsigned long wait_time;
	unsigned long min_wait_time = 0;

	while (!kdamond_need_stop(ctx)) {
		damon_for_each_scheme(s, ctx) {
			wait_time = damos_wmark_wait_us(s);
			if (!min_wait_time || wait_time < min_wait_time)
				min_wait_time = wait_time;
		}
		if (!min_wait_time)
			return 0;

		kdamond_usleep(min_wait_time);
	}
	return -EBUSY;
}

/*
 * The monitoring daemon that runs as a kernel thread
 */
static int kdamond_fn(void *data)
{
	struct damon_ctx *ctx = (struct damon_ctx *)data;
	struct damon_target *t;
	struct damon_region *r, *next;
	unsigned int max_nr_accesses = 0;
	unsigned long sz_limit = 0;
	bool done = false;

	pr_debug("kdamond (%d) starts\n", current->pid);

	if (ctx->primitive.init)
		ctx->primitive.init(ctx);
	if (ctx->callback.before_start && ctx->callback.before_start(ctx))
		done = true;

	sz_limit = damon_region_sz_limit(ctx);

	while (!kdamond_need_stop(ctx) && !done) {
		if (kdamond_wait_activation(ctx))
			continue;

		if (ctx->primitive.prepare_access_checks)
			ctx->primitive.prepare_access_checks(ctx);
		if (ctx->callback.after_sampling &&
				ctx->callback.after_sampling(ctx))
			done = true;

		kdamond_usleep(ctx->sample_interval);

		if (ctx->primitive.check_accesses)
			max_nr_accesses = ctx->primitive.check_accesses(ctx);

		if (kdamond_aggregate_interval_passed(ctx)) {
			kdamond_merge_regions(ctx,
					max_nr_accesses / 10,
					sz_limit);
			if (ctx->callback.after_aggregation &&
					ctx->callback.after_aggregation(ctx))
				done = true;
			kdamond_apply_schemes(ctx);
			kdamond_reset_aggregated(ctx);
			kdamond_split_regions(ctx);
			if (ctx->primitive.reset_aggregated)
				ctx->primitive.reset_aggregated(ctx);
		}

		if (kdamond_need_update_primitive(ctx)) {
			if (ctx->primitive.update)
				ctx->primitive.update(ctx);
			sz_limit = damon_region_sz_limit(ctx);
		}
	}
	damon_for_each_target(t, ctx) {
		damon_for_each_region_safe(r, next, t)
			damon_destroy_region(r, t);
	}

	if (ctx->callback.before_terminate)
		ctx->callback.before_terminate(ctx);
	if (ctx->primitive.cleanup)
		ctx->primitive.cleanup(ctx);

	pr_debug("kdamond (%d) finishes\n", current->pid);
	mutex_lock(&ctx->kdamond_lock);
	ctx->kdamond = NULL;
	mutex_unlock(&ctx->kdamond_lock);

	mutex_lock(&damon_lock);
	nr_running_ctxs--;
	mutex_unlock(&damon_lock);

	return 0;
}

#include "core-test.h"