1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Data Access Monitor
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Author: SeongJae Park <sjpark@amazon.de>
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #define pr_fmt(fmt) "damon: " fmt
9*4882a593Smuzhiyun
10*4882a593Smuzhiyun #include <linux/damon.h>
11*4882a593Smuzhiyun #include <linux/delay.h>
12*4882a593Smuzhiyun #include <linux/kthread.h>
13*4882a593Smuzhiyun #include <linux/mm.h>
14*4882a593Smuzhiyun #include <linux/slab.h>
15*4882a593Smuzhiyun #include <linux/string.h>
16*4882a593Smuzhiyun
17*4882a593Smuzhiyun #define CREATE_TRACE_POINTS
18*4882a593Smuzhiyun #include <trace/events/damon.h>
19*4882a593Smuzhiyun
20*4882a593Smuzhiyun #ifdef CONFIG_DAMON_KUNIT_TEST
21*4882a593Smuzhiyun #undef DAMON_MIN_REGION
22*4882a593Smuzhiyun #define DAMON_MIN_REGION 1
23*4882a593Smuzhiyun #endif
24*4882a593Smuzhiyun
25*4882a593Smuzhiyun static DEFINE_MUTEX(damon_lock);
26*4882a593Smuzhiyun static int nr_running_ctxs;
27*4882a593Smuzhiyun
28*4882a593Smuzhiyun /*
29*4882a593Smuzhiyun * Construct a damon_region struct
30*4882a593Smuzhiyun *
31*4882a593Smuzhiyun * Returns the pointer to the new struct if success, or NULL otherwise
32*4882a593Smuzhiyun */
damon_new_region(unsigned long start,unsigned long end)33*4882a593Smuzhiyun struct damon_region *damon_new_region(unsigned long start, unsigned long end)
34*4882a593Smuzhiyun {
35*4882a593Smuzhiyun struct damon_region *region;
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun region = kmalloc(sizeof(*region), GFP_KERNEL);
38*4882a593Smuzhiyun if (!region)
39*4882a593Smuzhiyun return NULL;
40*4882a593Smuzhiyun
41*4882a593Smuzhiyun region->ar.start = start;
42*4882a593Smuzhiyun region->ar.end = end;
43*4882a593Smuzhiyun region->nr_accesses = 0;
44*4882a593Smuzhiyun INIT_LIST_HEAD(®ion->list);
45*4882a593Smuzhiyun
46*4882a593Smuzhiyun region->age = 0;
47*4882a593Smuzhiyun region->last_nr_accesses = 0;
48*4882a593Smuzhiyun
49*4882a593Smuzhiyun return region;
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
damon_add_region(struct damon_region * r,struct damon_target * t)52*4882a593Smuzhiyun void damon_add_region(struct damon_region *r, struct damon_target *t)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun list_add_tail(&r->list, &t->regions_list);
55*4882a593Smuzhiyun t->nr_regions++;
56*4882a593Smuzhiyun }
57*4882a593Smuzhiyun
damon_del_region(struct damon_region * r,struct damon_target * t)58*4882a593Smuzhiyun static void damon_del_region(struct damon_region *r, struct damon_target *t)
59*4882a593Smuzhiyun {
60*4882a593Smuzhiyun list_del(&r->list);
61*4882a593Smuzhiyun t->nr_regions--;
62*4882a593Smuzhiyun }
63*4882a593Smuzhiyun
/* Release the memory of @r.  The region is not unlinked from any list here. */
static void damon_free_region(struct damon_region *r)
{
	kfree(r);
}
68*4882a593Smuzhiyun
/*
 * Remove @r from @t (unlinking it and adjusting the region count), then free
 * it.  @r must not be used after this returns.
 */
void damon_destroy_region(struct damon_region *r, struct damon_target *t)
{
	/* Unlink first so that the list never refers to freed memory */
	damon_del_region(r, t);
	damon_free_region(r);
}
74*4882a593Smuzhiyun
damon_new_scheme(unsigned long min_sz_region,unsigned long max_sz_region,unsigned int min_nr_accesses,unsigned int max_nr_accesses,unsigned int min_age_region,unsigned int max_age_region,enum damos_action action,struct damos_quota * quota,struct damos_watermarks * wmarks)75*4882a593Smuzhiyun struct damos *damon_new_scheme(
76*4882a593Smuzhiyun unsigned long min_sz_region, unsigned long max_sz_region,
77*4882a593Smuzhiyun unsigned int min_nr_accesses, unsigned int max_nr_accesses,
78*4882a593Smuzhiyun unsigned int min_age_region, unsigned int max_age_region,
79*4882a593Smuzhiyun enum damos_action action, struct damos_quota *quota,
80*4882a593Smuzhiyun struct damos_watermarks *wmarks)
81*4882a593Smuzhiyun {
82*4882a593Smuzhiyun struct damos *scheme;
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun scheme = kmalloc(sizeof(*scheme), GFP_KERNEL);
85*4882a593Smuzhiyun if (!scheme)
86*4882a593Smuzhiyun return NULL;
87*4882a593Smuzhiyun scheme->min_sz_region = min_sz_region;
88*4882a593Smuzhiyun scheme->max_sz_region = max_sz_region;
89*4882a593Smuzhiyun scheme->min_nr_accesses = min_nr_accesses;
90*4882a593Smuzhiyun scheme->max_nr_accesses = max_nr_accesses;
91*4882a593Smuzhiyun scheme->min_age_region = min_age_region;
92*4882a593Smuzhiyun scheme->max_age_region = max_age_region;
93*4882a593Smuzhiyun scheme->action = action;
94*4882a593Smuzhiyun scheme->stat = (struct damos_stat){};
95*4882a593Smuzhiyun INIT_LIST_HEAD(&scheme->list);
96*4882a593Smuzhiyun
97*4882a593Smuzhiyun scheme->quota.ms = quota->ms;
98*4882a593Smuzhiyun scheme->quota.sz = quota->sz;
99*4882a593Smuzhiyun scheme->quota.reset_interval = quota->reset_interval;
100*4882a593Smuzhiyun scheme->quota.weight_sz = quota->weight_sz;
101*4882a593Smuzhiyun scheme->quota.weight_nr_accesses = quota->weight_nr_accesses;
102*4882a593Smuzhiyun scheme->quota.weight_age = quota->weight_age;
103*4882a593Smuzhiyun scheme->quota.total_charged_sz = 0;
104*4882a593Smuzhiyun scheme->quota.total_charged_ns = 0;
105*4882a593Smuzhiyun scheme->quota.esz = 0;
106*4882a593Smuzhiyun scheme->quota.charged_sz = 0;
107*4882a593Smuzhiyun scheme->quota.charged_from = 0;
108*4882a593Smuzhiyun scheme->quota.charge_target_from = NULL;
109*4882a593Smuzhiyun scheme->quota.charge_addr_from = 0;
110*4882a593Smuzhiyun
111*4882a593Smuzhiyun scheme->wmarks.metric = wmarks->metric;
112*4882a593Smuzhiyun scheme->wmarks.interval = wmarks->interval;
113*4882a593Smuzhiyun scheme->wmarks.high = wmarks->high;
114*4882a593Smuzhiyun scheme->wmarks.mid = wmarks->mid;
115*4882a593Smuzhiyun scheme->wmarks.low = wmarks->low;
116*4882a593Smuzhiyun scheme->wmarks.activated = true;
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun return scheme;
119*4882a593Smuzhiyun }
120*4882a593Smuzhiyun
damon_add_scheme(struct damon_ctx * ctx,struct damos * s)121*4882a593Smuzhiyun void damon_add_scheme(struct damon_ctx *ctx, struct damos *s)
122*4882a593Smuzhiyun {
123*4882a593Smuzhiyun list_add_tail(&s->list, &ctx->schemes);
124*4882a593Smuzhiyun }
125*4882a593Smuzhiyun
damon_del_scheme(struct damos * s)126*4882a593Smuzhiyun static void damon_del_scheme(struct damos *s)
127*4882a593Smuzhiyun {
128*4882a593Smuzhiyun list_del(&s->list);
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
/* Release the memory of @s.  The scheme is not unlinked from any list here. */
static void damon_free_scheme(struct damos *s)
{
	kfree(s);
}
135*4882a593Smuzhiyun
/*
 * Unlink scheme @s from its list and free it.  @s must not be used after this
 * returns.
 */
void damon_destroy_scheme(struct damos *s)
{
	/* Unlink first so that the list never refers to freed memory */
	damon_del_scheme(s);
	damon_free_scheme(s);
}
141*4882a593Smuzhiyun
142*4882a593Smuzhiyun /*
143*4882a593Smuzhiyun * Construct a damon_target struct
144*4882a593Smuzhiyun *
145*4882a593Smuzhiyun * Returns the pointer to the new struct if success, or NULL otherwise
146*4882a593Smuzhiyun */
damon_new_target(unsigned long id)147*4882a593Smuzhiyun struct damon_target *damon_new_target(unsigned long id)
148*4882a593Smuzhiyun {
149*4882a593Smuzhiyun struct damon_target *t;
150*4882a593Smuzhiyun
151*4882a593Smuzhiyun t = kmalloc(sizeof(*t), GFP_KERNEL);
152*4882a593Smuzhiyun if (!t)
153*4882a593Smuzhiyun return NULL;
154*4882a593Smuzhiyun
155*4882a593Smuzhiyun t->id = id;
156*4882a593Smuzhiyun t->nr_regions = 0;
157*4882a593Smuzhiyun INIT_LIST_HEAD(&t->regions_list);
158*4882a593Smuzhiyun INIT_LIST_HEAD(&t->list);
159*4882a593Smuzhiyun
160*4882a593Smuzhiyun return t;
161*4882a593Smuzhiyun }
162*4882a593Smuzhiyun
damon_add_target(struct damon_ctx * ctx,struct damon_target * t)163*4882a593Smuzhiyun void damon_add_target(struct damon_ctx *ctx, struct damon_target *t)
164*4882a593Smuzhiyun {
165*4882a593Smuzhiyun list_add_tail(&t->list, &ctx->adaptive_targets);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun
damon_targets_empty(struct damon_ctx * ctx)168*4882a593Smuzhiyun bool damon_targets_empty(struct damon_ctx *ctx)
169*4882a593Smuzhiyun {
170*4882a593Smuzhiyun return list_empty(&ctx->adaptive_targets);
171*4882a593Smuzhiyun }
172*4882a593Smuzhiyun
damon_del_target(struct damon_target * t)173*4882a593Smuzhiyun static void damon_del_target(struct damon_target *t)
174*4882a593Smuzhiyun {
175*4882a593Smuzhiyun list_del(&t->list);
176*4882a593Smuzhiyun }
177*4882a593Smuzhiyun
damon_free_target(struct damon_target * t)178*4882a593Smuzhiyun void damon_free_target(struct damon_target *t)
179*4882a593Smuzhiyun {
180*4882a593Smuzhiyun struct damon_region *r, *next;
181*4882a593Smuzhiyun
182*4882a593Smuzhiyun damon_for_each_region_safe(r, next, t)
183*4882a593Smuzhiyun damon_free_region(r);
184*4882a593Smuzhiyun kfree(t);
185*4882a593Smuzhiyun }
186*4882a593Smuzhiyun
/*
 * Unlink target @t from its list, then free it together with all of its
 * regions.  @t must not be used after this returns.
 */
void damon_destroy_target(struct damon_target *t)
{
	/* Unlink first so that the list never refers to freed memory */
	damon_del_target(t);
	damon_free_target(t);
}
192*4882a593Smuzhiyun
damon_nr_regions(struct damon_target * t)193*4882a593Smuzhiyun unsigned int damon_nr_regions(struct damon_target *t)
194*4882a593Smuzhiyun {
195*4882a593Smuzhiyun return t->nr_regions;
196*4882a593Smuzhiyun }
197*4882a593Smuzhiyun
damon_new_ctx(void)198*4882a593Smuzhiyun struct damon_ctx *damon_new_ctx(void)
199*4882a593Smuzhiyun {
200*4882a593Smuzhiyun struct damon_ctx *ctx;
201*4882a593Smuzhiyun
202*4882a593Smuzhiyun ctx = kzalloc(sizeof(*ctx), GFP_KERNEL);
203*4882a593Smuzhiyun if (!ctx)
204*4882a593Smuzhiyun return NULL;
205*4882a593Smuzhiyun
206*4882a593Smuzhiyun ctx->sample_interval = 5 * 1000;
207*4882a593Smuzhiyun ctx->aggr_interval = 100 * 1000;
208*4882a593Smuzhiyun ctx->primitive_update_interval = 60 * 1000 * 1000;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun ktime_get_coarse_ts64(&ctx->last_aggregation);
211*4882a593Smuzhiyun ctx->last_primitive_update = ctx->last_aggregation;
212*4882a593Smuzhiyun
213*4882a593Smuzhiyun mutex_init(&ctx->kdamond_lock);
214*4882a593Smuzhiyun
215*4882a593Smuzhiyun ctx->min_nr_regions = 10;
216*4882a593Smuzhiyun ctx->max_nr_regions = 1000;
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun INIT_LIST_HEAD(&ctx->adaptive_targets);
219*4882a593Smuzhiyun INIT_LIST_HEAD(&ctx->schemes);
220*4882a593Smuzhiyun
221*4882a593Smuzhiyun return ctx;
222*4882a593Smuzhiyun }
223*4882a593Smuzhiyun
damon_destroy_targets(struct damon_ctx * ctx)224*4882a593Smuzhiyun static void damon_destroy_targets(struct damon_ctx *ctx)
225*4882a593Smuzhiyun {
226*4882a593Smuzhiyun struct damon_target *t, *next_t;
227*4882a593Smuzhiyun
228*4882a593Smuzhiyun if (ctx->primitive.cleanup) {
229*4882a593Smuzhiyun ctx->primitive.cleanup(ctx);
230*4882a593Smuzhiyun return;
231*4882a593Smuzhiyun }
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun damon_for_each_target_safe(t, next_t, ctx)
234*4882a593Smuzhiyun damon_destroy_target(t);
235*4882a593Smuzhiyun }
236*4882a593Smuzhiyun
damon_destroy_ctx(struct damon_ctx * ctx)237*4882a593Smuzhiyun void damon_destroy_ctx(struct damon_ctx *ctx)
238*4882a593Smuzhiyun {
239*4882a593Smuzhiyun struct damos *s, *next_s;
240*4882a593Smuzhiyun
241*4882a593Smuzhiyun damon_destroy_targets(ctx);
242*4882a593Smuzhiyun
243*4882a593Smuzhiyun damon_for_each_scheme_safe(s, next_s, ctx)
244*4882a593Smuzhiyun damon_destroy_scheme(s);
245*4882a593Smuzhiyun
246*4882a593Smuzhiyun kfree(ctx);
247*4882a593Smuzhiyun }
248*4882a593Smuzhiyun
249*4882a593Smuzhiyun /**
250*4882a593Smuzhiyun * damon_set_targets() - Set monitoring targets.
251*4882a593Smuzhiyun * @ctx: monitoring context
252*4882a593Smuzhiyun * @ids: array of target ids
253*4882a593Smuzhiyun * @nr_ids: number of entries in @ids
254*4882a593Smuzhiyun *
255*4882a593Smuzhiyun * This function should not be called while the kdamond is running.
256*4882a593Smuzhiyun *
257*4882a593Smuzhiyun * Return: 0 on success, negative error code otherwise.
258*4882a593Smuzhiyun */
damon_set_targets(struct damon_ctx * ctx,unsigned long * ids,ssize_t nr_ids)259*4882a593Smuzhiyun int damon_set_targets(struct damon_ctx *ctx,
260*4882a593Smuzhiyun unsigned long *ids, ssize_t nr_ids)
261*4882a593Smuzhiyun {
262*4882a593Smuzhiyun ssize_t i;
263*4882a593Smuzhiyun struct damon_target *t, *next;
264*4882a593Smuzhiyun
265*4882a593Smuzhiyun damon_destroy_targets(ctx);
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun for (i = 0; i < nr_ids; i++) {
268*4882a593Smuzhiyun t = damon_new_target(ids[i]);
269*4882a593Smuzhiyun if (!t) {
270*4882a593Smuzhiyun /* The caller should do cleanup of the ids itself */
271*4882a593Smuzhiyun damon_for_each_target_safe(t, next, ctx)
272*4882a593Smuzhiyun damon_destroy_target(t);
273*4882a593Smuzhiyun return -ENOMEM;
274*4882a593Smuzhiyun }
275*4882a593Smuzhiyun damon_add_target(ctx, t);
276*4882a593Smuzhiyun }
277*4882a593Smuzhiyun
278*4882a593Smuzhiyun return 0;
279*4882a593Smuzhiyun }
280*4882a593Smuzhiyun
281*4882a593Smuzhiyun /**
282*4882a593Smuzhiyun * damon_set_attrs() - Set attributes for the monitoring.
283*4882a593Smuzhiyun * @ctx: monitoring context
284*4882a593Smuzhiyun * @sample_int: time interval between samplings
285*4882a593Smuzhiyun * @aggr_int: time interval between aggregations
286*4882a593Smuzhiyun * @primitive_upd_int: time interval between monitoring primitive updates
287*4882a593Smuzhiyun * @min_nr_reg: minimal number of regions
288*4882a593Smuzhiyun * @max_nr_reg: maximum number of regions
289*4882a593Smuzhiyun *
290*4882a593Smuzhiyun * This function should not be called while the kdamond is running.
291*4882a593Smuzhiyun * Every time interval is in micro-seconds.
292*4882a593Smuzhiyun *
293*4882a593Smuzhiyun * Return: 0 on success, negative error code otherwise.
294*4882a593Smuzhiyun */
damon_set_attrs(struct damon_ctx * ctx,unsigned long sample_int,unsigned long aggr_int,unsigned long primitive_upd_int,unsigned long min_nr_reg,unsigned long max_nr_reg)295*4882a593Smuzhiyun int damon_set_attrs(struct damon_ctx *ctx, unsigned long sample_int,
296*4882a593Smuzhiyun unsigned long aggr_int, unsigned long primitive_upd_int,
297*4882a593Smuzhiyun unsigned long min_nr_reg, unsigned long max_nr_reg)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun if (min_nr_reg < 3)
300*4882a593Smuzhiyun return -EINVAL;
301*4882a593Smuzhiyun if (min_nr_reg > max_nr_reg)
302*4882a593Smuzhiyun return -EINVAL;
303*4882a593Smuzhiyun
304*4882a593Smuzhiyun ctx->sample_interval = sample_int;
305*4882a593Smuzhiyun ctx->aggr_interval = aggr_int;
306*4882a593Smuzhiyun ctx->primitive_update_interval = primitive_upd_int;
307*4882a593Smuzhiyun ctx->min_nr_regions = min_nr_reg;
308*4882a593Smuzhiyun ctx->max_nr_regions = max_nr_reg;
309*4882a593Smuzhiyun
310*4882a593Smuzhiyun return 0;
311*4882a593Smuzhiyun }
312*4882a593Smuzhiyun
313*4882a593Smuzhiyun /**
314*4882a593Smuzhiyun * damon_set_schemes() - Set data access monitoring based operation schemes.
315*4882a593Smuzhiyun * @ctx: monitoring context
316*4882a593Smuzhiyun * @schemes: array of the schemes
317*4882a593Smuzhiyun * @nr_schemes: number of entries in @schemes
318*4882a593Smuzhiyun *
319*4882a593Smuzhiyun * This function should not be called while the kdamond of the context is
320*4882a593Smuzhiyun * running.
321*4882a593Smuzhiyun *
322*4882a593Smuzhiyun * Return: 0 if success, or negative error code otherwise.
323*4882a593Smuzhiyun */
damon_set_schemes(struct damon_ctx * ctx,struct damos ** schemes,ssize_t nr_schemes)324*4882a593Smuzhiyun int damon_set_schemes(struct damon_ctx *ctx, struct damos **schemes,
325*4882a593Smuzhiyun ssize_t nr_schemes)
326*4882a593Smuzhiyun {
327*4882a593Smuzhiyun struct damos *s, *next;
328*4882a593Smuzhiyun ssize_t i;
329*4882a593Smuzhiyun
330*4882a593Smuzhiyun damon_for_each_scheme_safe(s, next, ctx)
331*4882a593Smuzhiyun damon_destroy_scheme(s);
332*4882a593Smuzhiyun for (i = 0; i < nr_schemes; i++)
333*4882a593Smuzhiyun damon_add_scheme(ctx, schemes[i]);
334*4882a593Smuzhiyun return 0;
335*4882a593Smuzhiyun }
336*4882a593Smuzhiyun
337*4882a593Smuzhiyun /**
338*4882a593Smuzhiyun * damon_nr_running_ctxs() - Return number of currently running contexts.
339*4882a593Smuzhiyun */
damon_nr_running_ctxs(void)340*4882a593Smuzhiyun int damon_nr_running_ctxs(void)
341*4882a593Smuzhiyun {
342*4882a593Smuzhiyun int nr_ctxs;
343*4882a593Smuzhiyun
344*4882a593Smuzhiyun mutex_lock(&damon_lock);
345*4882a593Smuzhiyun nr_ctxs = nr_running_ctxs;
346*4882a593Smuzhiyun mutex_unlock(&damon_lock);
347*4882a593Smuzhiyun
348*4882a593Smuzhiyun return nr_ctxs;
349*4882a593Smuzhiyun }
350*4882a593Smuzhiyun
351*4882a593Smuzhiyun /* Returns the size upper limit for each monitoring region */
damon_region_sz_limit(struct damon_ctx * ctx)352*4882a593Smuzhiyun static unsigned long damon_region_sz_limit(struct damon_ctx *ctx)
353*4882a593Smuzhiyun {
354*4882a593Smuzhiyun struct damon_target *t;
355*4882a593Smuzhiyun struct damon_region *r;
356*4882a593Smuzhiyun unsigned long sz = 0;
357*4882a593Smuzhiyun
358*4882a593Smuzhiyun damon_for_each_target(t, ctx) {
359*4882a593Smuzhiyun damon_for_each_region(r, t)
360*4882a593Smuzhiyun sz += r->ar.end - r->ar.start;
361*4882a593Smuzhiyun }
362*4882a593Smuzhiyun
363*4882a593Smuzhiyun if (ctx->min_nr_regions)
364*4882a593Smuzhiyun sz /= ctx->min_nr_regions;
365*4882a593Smuzhiyun if (sz < DAMON_MIN_REGION)
366*4882a593Smuzhiyun sz = DAMON_MIN_REGION;
367*4882a593Smuzhiyun
368*4882a593Smuzhiyun return sz;
369*4882a593Smuzhiyun }
370*4882a593Smuzhiyun
371*4882a593Smuzhiyun static int kdamond_fn(void *data);
372*4882a593Smuzhiyun
373*4882a593Smuzhiyun /*
374*4882a593Smuzhiyun * __damon_start() - Starts monitoring with given context.
375*4882a593Smuzhiyun * @ctx: monitoring context
376*4882a593Smuzhiyun *
377*4882a593Smuzhiyun * This function should be called while damon_lock is hold.
378*4882a593Smuzhiyun *
379*4882a593Smuzhiyun * Return: 0 on success, negative error code otherwise.
380*4882a593Smuzhiyun */
__damon_start(struct damon_ctx * ctx)381*4882a593Smuzhiyun static int __damon_start(struct damon_ctx *ctx)
382*4882a593Smuzhiyun {
383*4882a593Smuzhiyun int err = -EBUSY;
384*4882a593Smuzhiyun
385*4882a593Smuzhiyun mutex_lock(&ctx->kdamond_lock);
386*4882a593Smuzhiyun if (!ctx->kdamond) {
387*4882a593Smuzhiyun err = 0;
388*4882a593Smuzhiyun ctx->kdamond = kthread_run(kdamond_fn, ctx, "kdamond.%d",
389*4882a593Smuzhiyun nr_running_ctxs);
390*4882a593Smuzhiyun if (IS_ERR(ctx->kdamond)) {
391*4882a593Smuzhiyun err = PTR_ERR(ctx->kdamond);
392*4882a593Smuzhiyun ctx->kdamond = NULL;
393*4882a593Smuzhiyun }
394*4882a593Smuzhiyun }
395*4882a593Smuzhiyun mutex_unlock(&ctx->kdamond_lock);
396*4882a593Smuzhiyun
397*4882a593Smuzhiyun return err;
398*4882a593Smuzhiyun }
399*4882a593Smuzhiyun
400*4882a593Smuzhiyun /**
401*4882a593Smuzhiyun * damon_start() - Starts the monitorings for a given group of contexts.
402*4882a593Smuzhiyun * @ctxs: an array of the pointers for contexts to start monitoring
403*4882a593Smuzhiyun * @nr_ctxs: size of @ctxs
404*4882a593Smuzhiyun *
405*4882a593Smuzhiyun * This function starts a group of monitoring threads for a group of monitoring
406*4882a593Smuzhiyun * contexts. One thread per each context is created and run in parallel. The
407*4882a593Smuzhiyun * caller should handle synchronization between the threads by itself. If a
408*4882a593Smuzhiyun * group of threads that created by other 'damon_start()' call is currently
409*4882a593Smuzhiyun * running, this function does nothing but returns -EBUSY.
410*4882a593Smuzhiyun *
411*4882a593Smuzhiyun * Return: 0 on success, negative error code otherwise.
412*4882a593Smuzhiyun */
damon_start(struct damon_ctx ** ctxs,int nr_ctxs)413*4882a593Smuzhiyun int damon_start(struct damon_ctx **ctxs, int nr_ctxs)
414*4882a593Smuzhiyun {
415*4882a593Smuzhiyun int i;
416*4882a593Smuzhiyun int err = 0;
417*4882a593Smuzhiyun
418*4882a593Smuzhiyun mutex_lock(&damon_lock);
419*4882a593Smuzhiyun if (nr_running_ctxs) {
420*4882a593Smuzhiyun mutex_unlock(&damon_lock);
421*4882a593Smuzhiyun return -EBUSY;
422*4882a593Smuzhiyun }
423*4882a593Smuzhiyun
424*4882a593Smuzhiyun for (i = 0; i < nr_ctxs; i++) {
425*4882a593Smuzhiyun err = __damon_start(ctxs[i]);
426*4882a593Smuzhiyun if (err)
427*4882a593Smuzhiyun break;
428*4882a593Smuzhiyun nr_running_ctxs++;
429*4882a593Smuzhiyun }
430*4882a593Smuzhiyun mutex_unlock(&damon_lock);
431*4882a593Smuzhiyun
432*4882a593Smuzhiyun return err;
433*4882a593Smuzhiyun }
434*4882a593Smuzhiyun
435*4882a593Smuzhiyun /*
436*4882a593Smuzhiyun * __damon_stop() - Stops monitoring of given context.
437*4882a593Smuzhiyun * @ctx: monitoring context
438*4882a593Smuzhiyun *
439*4882a593Smuzhiyun * Return: 0 on success, negative error code otherwise.
440*4882a593Smuzhiyun */
__damon_stop(struct damon_ctx * ctx)441*4882a593Smuzhiyun static int __damon_stop(struct damon_ctx *ctx)
442*4882a593Smuzhiyun {
443*4882a593Smuzhiyun struct task_struct *tsk;
444*4882a593Smuzhiyun
445*4882a593Smuzhiyun mutex_lock(&ctx->kdamond_lock);
446*4882a593Smuzhiyun tsk = ctx->kdamond;
447*4882a593Smuzhiyun if (tsk) {
448*4882a593Smuzhiyun get_task_struct(tsk);
449*4882a593Smuzhiyun mutex_unlock(&ctx->kdamond_lock);
450*4882a593Smuzhiyun kthread_stop(tsk);
451*4882a593Smuzhiyun put_task_struct(tsk);
452*4882a593Smuzhiyun return 0;
453*4882a593Smuzhiyun }
454*4882a593Smuzhiyun mutex_unlock(&ctx->kdamond_lock);
455*4882a593Smuzhiyun
456*4882a593Smuzhiyun return -EPERM;
457*4882a593Smuzhiyun }
458*4882a593Smuzhiyun
/**
 * damon_stop() - Stops the monitorings for a given group of contexts.
 * @ctxs:	an array of the pointers for contexts to stop monitoring
 * @nr_ctxs:	size of @ctxs
 *
 * The contexts are stopped in the order of the array.  The first failure
 * ends the loop, so the contexts after the failing one are left untouched.
 *
 * Return: 0 on success, negative error code otherwise.
 */
int damon_stop(struct damon_ctx **ctxs, int nr_ctxs)
{
	int idx;

	for (idx = 0; idx < nr_ctxs; idx++) {
		/* nr_running_ctxs is decremented in kdamond_fn */
		int ret = __damon_stop(ctxs[idx]);

		if (ret)
			return ret;
	}

	return 0;
}
479*4882a593Smuzhiyun
480*4882a593Smuzhiyun /*
481*4882a593Smuzhiyun * damon_check_reset_time_interval() - Check if a time interval is elapsed.
482*4882a593Smuzhiyun * @baseline: the time to check whether the interval has elapsed since
483*4882a593Smuzhiyun * @interval: the time interval (microseconds)
484*4882a593Smuzhiyun *
485*4882a593Smuzhiyun * See whether the given time interval has passed since the given baseline
486*4882a593Smuzhiyun * time. If so, it also updates the baseline to current time for next check.
487*4882a593Smuzhiyun *
488*4882a593Smuzhiyun * Return: true if the time interval has passed, or false otherwise.
489*4882a593Smuzhiyun */
damon_check_reset_time_interval(struct timespec64 * baseline,unsigned long interval)490*4882a593Smuzhiyun static bool damon_check_reset_time_interval(struct timespec64 *baseline,
491*4882a593Smuzhiyun unsigned long interval)
492*4882a593Smuzhiyun {
493*4882a593Smuzhiyun struct timespec64 now;
494*4882a593Smuzhiyun
495*4882a593Smuzhiyun ktime_get_coarse_ts64(&now);
496*4882a593Smuzhiyun if ((timespec64_to_ns(&now) - timespec64_to_ns(baseline)) <
497*4882a593Smuzhiyun interval * 1000)
498*4882a593Smuzhiyun return false;
499*4882a593Smuzhiyun *baseline = now;
500*4882a593Smuzhiyun return true;
501*4882a593Smuzhiyun }
502*4882a593Smuzhiyun
503*4882a593Smuzhiyun /*
504*4882a593Smuzhiyun * Check whether it is time to flush the aggregated information
505*4882a593Smuzhiyun */
kdamond_aggregate_interval_passed(struct damon_ctx * ctx)506*4882a593Smuzhiyun static bool kdamond_aggregate_interval_passed(struct damon_ctx *ctx)
507*4882a593Smuzhiyun {
508*4882a593Smuzhiyun return damon_check_reset_time_interval(&ctx->last_aggregation,
509*4882a593Smuzhiyun ctx->aggr_interval);
510*4882a593Smuzhiyun }
511*4882a593Smuzhiyun
512*4882a593Smuzhiyun /*
513*4882a593Smuzhiyun * Reset the aggregated monitoring results ('nr_accesses' of each region).
514*4882a593Smuzhiyun */
kdamond_reset_aggregated(struct damon_ctx * c)515*4882a593Smuzhiyun static void kdamond_reset_aggregated(struct damon_ctx *c)
516*4882a593Smuzhiyun {
517*4882a593Smuzhiyun struct damon_target *t;
518*4882a593Smuzhiyun unsigned int ti = 0; /* target's index */
519*4882a593Smuzhiyun
520*4882a593Smuzhiyun damon_for_each_target(t, c) {
521*4882a593Smuzhiyun struct damon_region *r;
522*4882a593Smuzhiyun
523*4882a593Smuzhiyun damon_for_each_region(r, t) {
524*4882a593Smuzhiyun trace_damon_aggregated(t, ti, r, damon_nr_regions(t));
525*4882a593Smuzhiyun r->last_nr_accesses = r->nr_accesses;
526*4882a593Smuzhiyun r->nr_accesses = 0;
527*4882a593Smuzhiyun }
528*4882a593Smuzhiyun ti++;
529*4882a593Smuzhiyun }
530*4882a593Smuzhiyun }
531*4882a593Smuzhiyun
532*4882a593Smuzhiyun static void damon_split_region_at(struct damon_ctx *ctx,
533*4882a593Smuzhiyun struct damon_target *t, struct damon_region *r,
534*4882a593Smuzhiyun unsigned long sz_r);
535*4882a593Smuzhiyun
__damos_valid_target(struct damon_region * r,struct damos * s)536*4882a593Smuzhiyun static bool __damos_valid_target(struct damon_region *r, struct damos *s)
537*4882a593Smuzhiyun {
538*4882a593Smuzhiyun unsigned long sz;
539*4882a593Smuzhiyun
540*4882a593Smuzhiyun sz = r->ar.end - r->ar.start;
541*4882a593Smuzhiyun return s->min_sz_region <= sz && sz <= s->max_sz_region &&
542*4882a593Smuzhiyun s->min_nr_accesses <= r->nr_accesses &&
543*4882a593Smuzhiyun r->nr_accesses <= s->max_nr_accesses &&
544*4882a593Smuzhiyun s->min_age_region <= r->age && r->age <= s->max_age_region;
545*4882a593Smuzhiyun }
546*4882a593Smuzhiyun
damos_valid_target(struct damon_ctx * c,struct damon_target * t,struct damon_region * r,struct damos * s)547*4882a593Smuzhiyun static bool damos_valid_target(struct damon_ctx *c, struct damon_target *t,
548*4882a593Smuzhiyun struct damon_region *r, struct damos *s)
549*4882a593Smuzhiyun {
550*4882a593Smuzhiyun bool ret = __damos_valid_target(r, s);
551*4882a593Smuzhiyun
552*4882a593Smuzhiyun if (!ret || !s->quota.esz || !c->primitive.get_scheme_score)
553*4882a593Smuzhiyun return ret;
554*4882a593Smuzhiyun
555*4882a593Smuzhiyun return c->primitive.get_scheme_score(c, t, r, s) >= s->quota.min_score;
556*4882a593Smuzhiyun }
557*4882a593Smuzhiyun
damon_do_apply_schemes(struct damon_ctx * c,struct damon_target * t,struct damon_region * r)558*4882a593Smuzhiyun static void damon_do_apply_schemes(struct damon_ctx *c,
559*4882a593Smuzhiyun struct damon_target *t,
560*4882a593Smuzhiyun struct damon_region *r)
561*4882a593Smuzhiyun {
562*4882a593Smuzhiyun struct damos *s;
563*4882a593Smuzhiyun
564*4882a593Smuzhiyun damon_for_each_scheme(s, c) {
565*4882a593Smuzhiyun struct damos_quota *quota = &s->quota;
566*4882a593Smuzhiyun unsigned long sz = r->ar.end - r->ar.start;
567*4882a593Smuzhiyun struct timespec64 begin, end;
568*4882a593Smuzhiyun unsigned long sz_applied = 0;
569*4882a593Smuzhiyun
570*4882a593Smuzhiyun if (!s->wmarks.activated)
571*4882a593Smuzhiyun continue;
572*4882a593Smuzhiyun
573*4882a593Smuzhiyun /* Check the quota */
574*4882a593Smuzhiyun if (quota->esz && quota->charged_sz >= quota->esz)
575*4882a593Smuzhiyun continue;
576*4882a593Smuzhiyun
577*4882a593Smuzhiyun /* Skip previously charged regions */
578*4882a593Smuzhiyun if (quota->charge_target_from) {
579*4882a593Smuzhiyun if (t != quota->charge_target_from)
580*4882a593Smuzhiyun continue;
581*4882a593Smuzhiyun if (r == damon_last_region(t)) {
582*4882a593Smuzhiyun quota->charge_target_from = NULL;
583*4882a593Smuzhiyun quota->charge_addr_from = 0;
584*4882a593Smuzhiyun continue;
585*4882a593Smuzhiyun }
586*4882a593Smuzhiyun if (quota->charge_addr_from &&
587*4882a593Smuzhiyun r->ar.end <= quota->charge_addr_from)
588*4882a593Smuzhiyun continue;
589*4882a593Smuzhiyun
590*4882a593Smuzhiyun if (quota->charge_addr_from && r->ar.start <
591*4882a593Smuzhiyun quota->charge_addr_from) {
592*4882a593Smuzhiyun sz = ALIGN_DOWN(quota->charge_addr_from -
593*4882a593Smuzhiyun r->ar.start, DAMON_MIN_REGION);
594*4882a593Smuzhiyun if (!sz) {
595*4882a593Smuzhiyun if (r->ar.end - r->ar.start <=
596*4882a593Smuzhiyun DAMON_MIN_REGION)
597*4882a593Smuzhiyun continue;
598*4882a593Smuzhiyun sz = DAMON_MIN_REGION;
599*4882a593Smuzhiyun }
600*4882a593Smuzhiyun damon_split_region_at(c, t, r, sz);
601*4882a593Smuzhiyun r = damon_next_region(r);
602*4882a593Smuzhiyun sz = r->ar.end - r->ar.start;
603*4882a593Smuzhiyun }
604*4882a593Smuzhiyun quota->charge_target_from = NULL;
605*4882a593Smuzhiyun quota->charge_addr_from = 0;
606*4882a593Smuzhiyun }
607*4882a593Smuzhiyun
608*4882a593Smuzhiyun if (!damos_valid_target(c, t, r, s))
609*4882a593Smuzhiyun continue;
610*4882a593Smuzhiyun
611*4882a593Smuzhiyun /* Apply the scheme */
612*4882a593Smuzhiyun if (c->primitive.apply_scheme) {
613*4882a593Smuzhiyun if (quota->esz &&
614*4882a593Smuzhiyun quota->charged_sz + sz > quota->esz) {
615*4882a593Smuzhiyun sz = ALIGN_DOWN(quota->esz - quota->charged_sz,
616*4882a593Smuzhiyun DAMON_MIN_REGION);
617*4882a593Smuzhiyun if (!sz)
618*4882a593Smuzhiyun goto update_stat;
619*4882a593Smuzhiyun damon_split_region_at(c, t, r, sz);
620*4882a593Smuzhiyun }
621*4882a593Smuzhiyun ktime_get_coarse_ts64(&begin);
622*4882a593Smuzhiyun sz_applied = c->primitive.apply_scheme(c, t, r, s);
623*4882a593Smuzhiyun ktime_get_coarse_ts64(&end);
624*4882a593Smuzhiyun quota->total_charged_ns += timespec64_to_ns(&end) -
625*4882a593Smuzhiyun timespec64_to_ns(&begin);
626*4882a593Smuzhiyun quota->charged_sz += sz;
627*4882a593Smuzhiyun if (quota->esz && quota->charged_sz >= quota->esz) {
628*4882a593Smuzhiyun quota->charge_target_from = t;
629*4882a593Smuzhiyun quota->charge_addr_from = r->ar.end + 1;
630*4882a593Smuzhiyun }
631*4882a593Smuzhiyun }
632*4882a593Smuzhiyun if (s->action != DAMOS_STAT)
633*4882a593Smuzhiyun r->age = 0;
634*4882a593Smuzhiyun
635*4882a593Smuzhiyun update_stat:
636*4882a593Smuzhiyun s->stat.nr_tried++;
637*4882a593Smuzhiyun s->stat.sz_tried += sz;
638*4882a593Smuzhiyun if (sz_applied)
639*4882a593Smuzhiyun s->stat.nr_applied++;
640*4882a593Smuzhiyun s->stat.sz_applied += sz_applied;
641*4882a593Smuzhiyun }
642*4882a593Smuzhiyun }
643*4882a593Smuzhiyun
644*4882a593Smuzhiyun /* Shouldn't be called if quota->ms and quota->sz are zero */
damos_set_effective_quota(struct damos_quota * quota)645*4882a593Smuzhiyun static void damos_set_effective_quota(struct damos_quota *quota)
646*4882a593Smuzhiyun {
647*4882a593Smuzhiyun unsigned long throughput;
648*4882a593Smuzhiyun unsigned long esz;
649*4882a593Smuzhiyun
650*4882a593Smuzhiyun if (!quota->ms) {
651*4882a593Smuzhiyun quota->esz = quota->sz;
652*4882a593Smuzhiyun return;
653*4882a593Smuzhiyun }
654*4882a593Smuzhiyun
655*4882a593Smuzhiyun if (quota->total_charged_ns)
656*4882a593Smuzhiyun throughput = quota->total_charged_sz * 1000000 /
657*4882a593Smuzhiyun quota->total_charged_ns;
658*4882a593Smuzhiyun else
659*4882a593Smuzhiyun throughput = PAGE_SIZE * 1024;
660*4882a593Smuzhiyun esz = throughput * quota->ms;
661*4882a593Smuzhiyun
662*4882a593Smuzhiyun if (quota->sz && quota->sz < esz)
663*4882a593Smuzhiyun esz = quota->sz;
664*4882a593Smuzhiyun quota->esz = esz;
665*4882a593Smuzhiyun }
666*4882a593Smuzhiyun
kdamond_apply_schemes(struct damon_ctx * c)667*4882a593Smuzhiyun static void kdamond_apply_schemes(struct damon_ctx *c)
668*4882a593Smuzhiyun {
669*4882a593Smuzhiyun struct damon_target *t;
670*4882a593Smuzhiyun struct damon_region *r, *next_r;
671*4882a593Smuzhiyun struct damos *s;
672*4882a593Smuzhiyun
673*4882a593Smuzhiyun damon_for_each_scheme(s, c) {
674*4882a593Smuzhiyun struct damos_quota *quota = &s->quota;
675*4882a593Smuzhiyun unsigned long cumulated_sz;
676*4882a593Smuzhiyun unsigned int score, max_score = 0;
677*4882a593Smuzhiyun
678*4882a593Smuzhiyun if (!s->wmarks.activated)
679*4882a593Smuzhiyun continue;
680*4882a593Smuzhiyun
681*4882a593Smuzhiyun if (!quota->ms && !quota->sz)
682*4882a593Smuzhiyun continue;
683*4882a593Smuzhiyun
684*4882a593Smuzhiyun /* New charge window starts */
685*4882a593Smuzhiyun if (time_after_eq(jiffies, quota->charged_from +
686*4882a593Smuzhiyun msecs_to_jiffies(
687*4882a593Smuzhiyun quota->reset_interval))) {
688*4882a593Smuzhiyun if (quota->esz && quota->charged_sz >= quota->esz)
689*4882a593Smuzhiyun s->stat.qt_exceeds++;
690*4882a593Smuzhiyun quota->total_charged_sz += quota->charged_sz;
691*4882a593Smuzhiyun quota->charged_from = jiffies;
692*4882a593Smuzhiyun quota->charged_sz = 0;
693*4882a593Smuzhiyun damos_set_effective_quota(quota);
694*4882a593Smuzhiyun }
695*4882a593Smuzhiyun
696*4882a593Smuzhiyun if (!c->primitive.get_scheme_score)
697*4882a593Smuzhiyun continue;
698*4882a593Smuzhiyun
699*4882a593Smuzhiyun /* Fill up the score histogram */
700*4882a593Smuzhiyun memset(quota->histogram, 0, sizeof(quota->histogram));
701*4882a593Smuzhiyun damon_for_each_target(t, c) {
702*4882a593Smuzhiyun damon_for_each_region(r, t) {
703*4882a593Smuzhiyun if (!__damos_valid_target(r, s))
704*4882a593Smuzhiyun continue;
705*4882a593Smuzhiyun score = c->primitive.get_scheme_score(
706*4882a593Smuzhiyun c, t, r, s);
707*4882a593Smuzhiyun quota->histogram[score] +=
708*4882a593Smuzhiyun r->ar.end - r->ar.start;
709*4882a593Smuzhiyun if (score > max_score)
710*4882a593Smuzhiyun max_score = score;
711*4882a593Smuzhiyun }
712*4882a593Smuzhiyun }
713*4882a593Smuzhiyun
714*4882a593Smuzhiyun /* Set the min score limit */
715*4882a593Smuzhiyun for (cumulated_sz = 0, score = max_score; ; score--) {
716*4882a593Smuzhiyun cumulated_sz += quota->histogram[score];
717*4882a593Smuzhiyun if (cumulated_sz >= quota->esz || !score)
718*4882a593Smuzhiyun break;
719*4882a593Smuzhiyun }
720*4882a593Smuzhiyun quota->min_score = score;
721*4882a593Smuzhiyun }
722*4882a593Smuzhiyun
723*4882a593Smuzhiyun damon_for_each_target(t, c) {
724*4882a593Smuzhiyun damon_for_each_region_safe(r, next_r, t)
725*4882a593Smuzhiyun damon_do_apply_schemes(c, t, r);
726*4882a593Smuzhiyun }
727*4882a593Smuzhiyun }
728*4882a593Smuzhiyun
sz_damon_region(struct damon_region * r)729*4882a593Smuzhiyun static inline unsigned long sz_damon_region(struct damon_region *r)
730*4882a593Smuzhiyun {
731*4882a593Smuzhiyun return r->ar.end - r->ar.start;
732*4882a593Smuzhiyun }
733*4882a593Smuzhiyun
734*4882a593Smuzhiyun /*
735*4882a593Smuzhiyun * Merge two adjacent regions into one region
736*4882a593Smuzhiyun */
damon_merge_two_regions(struct damon_target * t,struct damon_region * l,struct damon_region * r)737*4882a593Smuzhiyun static void damon_merge_two_regions(struct damon_target *t,
738*4882a593Smuzhiyun struct damon_region *l, struct damon_region *r)
739*4882a593Smuzhiyun {
740*4882a593Smuzhiyun unsigned long sz_l = sz_damon_region(l), sz_r = sz_damon_region(r);
741*4882a593Smuzhiyun
742*4882a593Smuzhiyun l->nr_accesses = (l->nr_accesses * sz_l + r->nr_accesses * sz_r) /
743*4882a593Smuzhiyun (sz_l + sz_r);
744*4882a593Smuzhiyun l->age = (l->age * sz_l + r->age * sz_r) / (sz_l + sz_r);
745*4882a593Smuzhiyun l->ar.end = r->ar.end;
746*4882a593Smuzhiyun damon_destroy_region(r, t);
747*4882a593Smuzhiyun }
748*4882a593Smuzhiyun
749*4882a593Smuzhiyun /*
750*4882a593Smuzhiyun * Merge adjacent regions having similar access frequencies
751*4882a593Smuzhiyun *
752*4882a593Smuzhiyun * t target affected by this merge operation
753*4882a593Smuzhiyun * thres '->nr_accesses' diff threshold for the merge
754*4882a593Smuzhiyun * sz_limit size upper limit of each region
755*4882a593Smuzhiyun */
damon_merge_regions_of(struct damon_target * t,unsigned int thres,unsigned long sz_limit)756*4882a593Smuzhiyun static void damon_merge_regions_of(struct damon_target *t, unsigned int thres,
757*4882a593Smuzhiyun unsigned long sz_limit)
758*4882a593Smuzhiyun {
759*4882a593Smuzhiyun struct damon_region *r, *prev = NULL, *next;
760*4882a593Smuzhiyun
761*4882a593Smuzhiyun damon_for_each_region_safe(r, next, t) {
762*4882a593Smuzhiyun if (abs(r->nr_accesses - r->last_nr_accesses) > thres)
763*4882a593Smuzhiyun r->age = 0;
764*4882a593Smuzhiyun else
765*4882a593Smuzhiyun r->age++;
766*4882a593Smuzhiyun
767*4882a593Smuzhiyun if (prev && prev->ar.end == r->ar.start &&
768*4882a593Smuzhiyun abs(prev->nr_accesses - r->nr_accesses) <= thres &&
769*4882a593Smuzhiyun sz_damon_region(prev) + sz_damon_region(r) <= sz_limit)
770*4882a593Smuzhiyun damon_merge_two_regions(t, prev, r);
771*4882a593Smuzhiyun else
772*4882a593Smuzhiyun prev = r;
773*4882a593Smuzhiyun }
774*4882a593Smuzhiyun }
775*4882a593Smuzhiyun
776*4882a593Smuzhiyun /*
777*4882a593Smuzhiyun * Merge adjacent regions having similar access frequencies
778*4882a593Smuzhiyun *
779*4882a593Smuzhiyun * threshold '->nr_accesses' diff threshold for the merge
780*4882a593Smuzhiyun * sz_limit size upper limit of each region
781*4882a593Smuzhiyun *
782*4882a593Smuzhiyun * This function merges monitoring target regions which are adjacent and their
783*4882a593Smuzhiyun * access frequencies are similar. This is for minimizing the monitoring
784*4882a593Smuzhiyun * overhead under the dynamically changeable access pattern. If a merge was
785*4882a593Smuzhiyun * unnecessarily made, later 'kdamond_split_regions()' will revert it.
786*4882a593Smuzhiyun */
kdamond_merge_regions(struct damon_ctx * c,unsigned int threshold,unsigned long sz_limit)787*4882a593Smuzhiyun static void kdamond_merge_regions(struct damon_ctx *c, unsigned int threshold,
788*4882a593Smuzhiyun unsigned long sz_limit)
789*4882a593Smuzhiyun {
790*4882a593Smuzhiyun struct damon_target *t;
791*4882a593Smuzhiyun
792*4882a593Smuzhiyun damon_for_each_target(t, c)
793*4882a593Smuzhiyun damon_merge_regions_of(t, threshold, sz_limit);
794*4882a593Smuzhiyun }
795*4882a593Smuzhiyun
796*4882a593Smuzhiyun /*
797*4882a593Smuzhiyun * Split a region in two
798*4882a593Smuzhiyun *
799*4882a593Smuzhiyun * r the region to be split
800*4882a593Smuzhiyun * sz_r size of the first sub-region that will be made
801*4882a593Smuzhiyun */
damon_split_region_at(struct damon_ctx * ctx,struct damon_target * t,struct damon_region * r,unsigned long sz_r)802*4882a593Smuzhiyun static void damon_split_region_at(struct damon_ctx *ctx,
803*4882a593Smuzhiyun struct damon_target *t, struct damon_region *r,
804*4882a593Smuzhiyun unsigned long sz_r)
805*4882a593Smuzhiyun {
806*4882a593Smuzhiyun struct damon_region *new;
807*4882a593Smuzhiyun
808*4882a593Smuzhiyun new = damon_new_region(r->ar.start + sz_r, r->ar.end);
809*4882a593Smuzhiyun if (!new)
810*4882a593Smuzhiyun return;
811*4882a593Smuzhiyun
812*4882a593Smuzhiyun r->ar.end = new->ar.start;
813*4882a593Smuzhiyun
814*4882a593Smuzhiyun new->age = r->age;
815*4882a593Smuzhiyun new->last_nr_accesses = r->last_nr_accesses;
816*4882a593Smuzhiyun
817*4882a593Smuzhiyun damon_insert_region(new, r, damon_next_region(r), t);
818*4882a593Smuzhiyun }
819*4882a593Smuzhiyun
820*4882a593Smuzhiyun /* Split every region in the given target into 'nr_subs' regions */
damon_split_regions_of(struct damon_ctx * ctx,struct damon_target * t,int nr_subs)821*4882a593Smuzhiyun static void damon_split_regions_of(struct damon_ctx *ctx,
822*4882a593Smuzhiyun struct damon_target *t, int nr_subs)
823*4882a593Smuzhiyun {
824*4882a593Smuzhiyun struct damon_region *r, *next;
825*4882a593Smuzhiyun unsigned long sz_region, sz_sub = 0;
826*4882a593Smuzhiyun int i;
827*4882a593Smuzhiyun
828*4882a593Smuzhiyun damon_for_each_region_safe(r, next, t) {
829*4882a593Smuzhiyun sz_region = r->ar.end - r->ar.start;
830*4882a593Smuzhiyun
831*4882a593Smuzhiyun for (i = 0; i < nr_subs - 1 &&
832*4882a593Smuzhiyun sz_region > 2 * DAMON_MIN_REGION; i++) {
833*4882a593Smuzhiyun /*
834*4882a593Smuzhiyun * Randomly select size of left sub-region to be at
835*4882a593Smuzhiyun * least 10 percent and at most 90% of original region
836*4882a593Smuzhiyun */
837*4882a593Smuzhiyun sz_sub = ALIGN_DOWN(damon_rand(1, 10) *
838*4882a593Smuzhiyun sz_region / 10, DAMON_MIN_REGION);
839*4882a593Smuzhiyun /* Do not allow blank region */
840*4882a593Smuzhiyun if (sz_sub == 0 || sz_sub >= sz_region)
841*4882a593Smuzhiyun continue;
842*4882a593Smuzhiyun
843*4882a593Smuzhiyun damon_split_region_at(ctx, t, r, sz_sub);
844*4882a593Smuzhiyun sz_region = sz_sub;
845*4882a593Smuzhiyun }
846*4882a593Smuzhiyun }
847*4882a593Smuzhiyun }
848*4882a593Smuzhiyun
849*4882a593Smuzhiyun /*
850*4882a593Smuzhiyun * Split every target region into randomly-sized small regions
851*4882a593Smuzhiyun *
852*4882a593Smuzhiyun * This function splits every target region into random-sized small regions if
853*4882a593Smuzhiyun * current total number of the regions is equal or smaller than half of the
854*4882a593Smuzhiyun * user-specified maximum number of regions. This is for maximizing the
855*4882a593Smuzhiyun * monitoring accuracy under the dynamically changeable access patterns. If a
856*4882a593Smuzhiyun * split was unnecessarily made, later 'kdamond_merge_regions()' will revert
857*4882a593Smuzhiyun * it.
858*4882a593Smuzhiyun */
kdamond_split_regions(struct damon_ctx * ctx)859*4882a593Smuzhiyun static void kdamond_split_regions(struct damon_ctx *ctx)
860*4882a593Smuzhiyun {
861*4882a593Smuzhiyun struct damon_target *t;
862*4882a593Smuzhiyun unsigned int nr_regions = 0;
863*4882a593Smuzhiyun static unsigned int last_nr_regions;
864*4882a593Smuzhiyun int nr_subregions = 2;
865*4882a593Smuzhiyun
866*4882a593Smuzhiyun damon_for_each_target(t, ctx)
867*4882a593Smuzhiyun nr_regions += damon_nr_regions(t);
868*4882a593Smuzhiyun
869*4882a593Smuzhiyun if (nr_regions > ctx->max_nr_regions / 2)
870*4882a593Smuzhiyun return;
871*4882a593Smuzhiyun
872*4882a593Smuzhiyun /* Maybe the middle of the region has different access frequency */
873*4882a593Smuzhiyun if (last_nr_regions == nr_regions &&
874*4882a593Smuzhiyun nr_regions < ctx->max_nr_regions / 3)
875*4882a593Smuzhiyun nr_subregions = 3;
876*4882a593Smuzhiyun
877*4882a593Smuzhiyun damon_for_each_target(t, ctx)
878*4882a593Smuzhiyun damon_split_regions_of(ctx, t, nr_subregions);
879*4882a593Smuzhiyun
880*4882a593Smuzhiyun last_nr_regions = nr_regions;
881*4882a593Smuzhiyun }
882*4882a593Smuzhiyun
883*4882a593Smuzhiyun /*
884*4882a593Smuzhiyun * Check whether it is time to check and apply the target monitoring regions
885*4882a593Smuzhiyun *
886*4882a593Smuzhiyun * Returns true if it is.
887*4882a593Smuzhiyun */
kdamond_need_update_primitive(struct damon_ctx * ctx)888*4882a593Smuzhiyun static bool kdamond_need_update_primitive(struct damon_ctx *ctx)
889*4882a593Smuzhiyun {
890*4882a593Smuzhiyun return damon_check_reset_time_interval(&ctx->last_primitive_update,
891*4882a593Smuzhiyun ctx->primitive_update_interval);
892*4882a593Smuzhiyun }
893*4882a593Smuzhiyun
894*4882a593Smuzhiyun /*
895*4882a593Smuzhiyun * Check whether current monitoring should be stopped
896*4882a593Smuzhiyun *
897*4882a593Smuzhiyun * The monitoring is stopped when either the user requested to stop, or all
898*4882a593Smuzhiyun * monitoring targets are invalid.
899*4882a593Smuzhiyun *
900*4882a593Smuzhiyun * Returns true if need to stop current monitoring.
901*4882a593Smuzhiyun */
kdamond_need_stop(struct damon_ctx * ctx)902*4882a593Smuzhiyun static bool kdamond_need_stop(struct damon_ctx *ctx)
903*4882a593Smuzhiyun {
904*4882a593Smuzhiyun struct damon_target *t;
905*4882a593Smuzhiyun
906*4882a593Smuzhiyun if (kthread_should_stop())
907*4882a593Smuzhiyun return true;
908*4882a593Smuzhiyun
909*4882a593Smuzhiyun if (!ctx->primitive.target_valid)
910*4882a593Smuzhiyun return false;
911*4882a593Smuzhiyun
912*4882a593Smuzhiyun damon_for_each_target(t, ctx) {
913*4882a593Smuzhiyun if (ctx->primitive.target_valid(t))
914*4882a593Smuzhiyun return false;
915*4882a593Smuzhiyun }
916*4882a593Smuzhiyun
917*4882a593Smuzhiyun return true;
918*4882a593Smuzhiyun }
919*4882a593Smuzhiyun
damos_wmark_metric_value(enum damos_wmark_metric metric)920*4882a593Smuzhiyun static unsigned long damos_wmark_metric_value(enum damos_wmark_metric metric)
921*4882a593Smuzhiyun {
922*4882a593Smuzhiyun struct sysinfo i;
923*4882a593Smuzhiyun
924*4882a593Smuzhiyun switch (metric) {
925*4882a593Smuzhiyun case DAMOS_WMARK_FREE_MEM_RATE:
926*4882a593Smuzhiyun si_meminfo(&i);
927*4882a593Smuzhiyun return i.freeram * 1000 / i.totalram;
928*4882a593Smuzhiyun default:
929*4882a593Smuzhiyun break;
930*4882a593Smuzhiyun }
931*4882a593Smuzhiyun return -EINVAL;
932*4882a593Smuzhiyun }
933*4882a593Smuzhiyun
934*4882a593Smuzhiyun /*
935*4882a593Smuzhiyun * Returns zero if the scheme is active. Else, returns time to wait for next
936*4882a593Smuzhiyun * watermark check in micro-seconds.
937*4882a593Smuzhiyun */
damos_wmark_wait_us(struct damos * scheme)938*4882a593Smuzhiyun static unsigned long damos_wmark_wait_us(struct damos *scheme)
939*4882a593Smuzhiyun {
940*4882a593Smuzhiyun unsigned long metric;
941*4882a593Smuzhiyun
942*4882a593Smuzhiyun if (scheme->wmarks.metric == DAMOS_WMARK_NONE)
943*4882a593Smuzhiyun return 0;
944*4882a593Smuzhiyun
945*4882a593Smuzhiyun metric = damos_wmark_metric_value(scheme->wmarks.metric);
946*4882a593Smuzhiyun /* higher than high watermark or lower than low watermark */
947*4882a593Smuzhiyun if (metric > scheme->wmarks.high || scheme->wmarks.low > metric) {
948*4882a593Smuzhiyun if (scheme->wmarks.activated)
949*4882a593Smuzhiyun pr_debug("deactivate a scheme (%d) for %s wmark\n",
950*4882a593Smuzhiyun scheme->action,
951*4882a593Smuzhiyun metric > scheme->wmarks.high ?
952*4882a593Smuzhiyun "high" : "low");
953*4882a593Smuzhiyun scheme->wmarks.activated = false;
954*4882a593Smuzhiyun return scheme->wmarks.interval;
955*4882a593Smuzhiyun }
956*4882a593Smuzhiyun
957*4882a593Smuzhiyun /* inactive and higher than middle watermark */
958*4882a593Smuzhiyun if ((scheme->wmarks.high >= metric && metric >= scheme->wmarks.mid) &&
959*4882a593Smuzhiyun !scheme->wmarks.activated)
960*4882a593Smuzhiyun return scheme->wmarks.interval;
961*4882a593Smuzhiyun
962*4882a593Smuzhiyun if (!scheme->wmarks.activated)
963*4882a593Smuzhiyun pr_debug("activate a scheme (%d)\n", scheme->action);
964*4882a593Smuzhiyun scheme->wmarks.activated = true;
965*4882a593Smuzhiyun return 0;
966*4882a593Smuzhiyun }
967*4882a593Smuzhiyun
kdamond_usleep(unsigned long usecs)968*4882a593Smuzhiyun static void kdamond_usleep(unsigned long usecs)
969*4882a593Smuzhiyun {
970*4882a593Smuzhiyun /* See Documentation/timers/timers-howto.rst for the thresholds */
971*4882a593Smuzhiyun if (usecs > 20 * USEC_PER_MSEC)
972*4882a593Smuzhiyun schedule_timeout_idle(usecs_to_jiffies(usecs));
973*4882a593Smuzhiyun else
974*4882a593Smuzhiyun usleep_idle_range(usecs, usecs + 1);
975*4882a593Smuzhiyun }
976*4882a593Smuzhiyun
977*4882a593Smuzhiyun /* Returns negative error code if it's not activated but should return */
kdamond_wait_activation(struct damon_ctx * ctx)978*4882a593Smuzhiyun static int kdamond_wait_activation(struct damon_ctx *ctx)
979*4882a593Smuzhiyun {
980*4882a593Smuzhiyun struct damos *s;
981*4882a593Smuzhiyun unsigned long wait_time;
982*4882a593Smuzhiyun unsigned long min_wait_time = 0;
983*4882a593Smuzhiyun
984*4882a593Smuzhiyun while (!kdamond_need_stop(ctx)) {
985*4882a593Smuzhiyun damon_for_each_scheme(s, ctx) {
986*4882a593Smuzhiyun wait_time = damos_wmark_wait_us(s);
987*4882a593Smuzhiyun if (!min_wait_time || wait_time < min_wait_time)
988*4882a593Smuzhiyun min_wait_time = wait_time;
989*4882a593Smuzhiyun }
990*4882a593Smuzhiyun if (!min_wait_time)
991*4882a593Smuzhiyun return 0;
992*4882a593Smuzhiyun
993*4882a593Smuzhiyun kdamond_usleep(min_wait_time);
994*4882a593Smuzhiyun }
995*4882a593Smuzhiyun return -EBUSY;
996*4882a593Smuzhiyun }
997*4882a593Smuzhiyun
998*4882a593Smuzhiyun /*
999*4882a593Smuzhiyun * The monitoring daemon that runs as a kernel thread
1000*4882a593Smuzhiyun */
kdamond_fn(void * data)1001*4882a593Smuzhiyun static int kdamond_fn(void *data)
1002*4882a593Smuzhiyun {
1003*4882a593Smuzhiyun struct damon_ctx *ctx = (struct damon_ctx *)data;
1004*4882a593Smuzhiyun struct damon_target *t;
1005*4882a593Smuzhiyun struct damon_region *r, *next;
1006*4882a593Smuzhiyun unsigned int max_nr_accesses = 0;
1007*4882a593Smuzhiyun unsigned long sz_limit = 0;
1008*4882a593Smuzhiyun bool done = false;
1009*4882a593Smuzhiyun
1010*4882a593Smuzhiyun pr_debug("kdamond (%d) starts\n", current->pid);
1011*4882a593Smuzhiyun
1012*4882a593Smuzhiyun if (ctx->primitive.init)
1013*4882a593Smuzhiyun ctx->primitive.init(ctx);
1014*4882a593Smuzhiyun if (ctx->callback.before_start && ctx->callback.before_start(ctx))
1015*4882a593Smuzhiyun done = true;
1016*4882a593Smuzhiyun
1017*4882a593Smuzhiyun sz_limit = damon_region_sz_limit(ctx);
1018*4882a593Smuzhiyun
1019*4882a593Smuzhiyun while (!kdamond_need_stop(ctx) && !done) {
1020*4882a593Smuzhiyun if (kdamond_wait_activation(ctx))
1021*4882a593Smuzhiyun continue;
1022*4882a593Smuzhiyun
1023*4882a593Smuzhiyun if (ctx->primitive.prepare_access_checks)
1024*4882a593Smuzhiyun ctx->primitive.prepare_access_checks(ctx);
1025*4882a593Smuzhiyun if (ctx->callback.after_sampling &&
1026*4882a593Smuzhiyun ctx->callback.after_sampling(ctx))
1027*4882a593Smuzhiyun done = true;
1028*4882a593Smuzhiyun
1029*4882a593Smuzhiyun kdamond_usleep(ctx->sample_interval);
1030*4882a593Smuzhiyun
1031*4882a593Smuzhiyun if (ctx->primitive.check_accesses)
1032*4882a593Smuzhiyun max_nr_accesses = ctx->primitive.check_accesses(ctx);
1033*4882a593Smuzhiyun
1034*4882a593Smuzhiyun if (kdamond_aggregate_interval_passed(ctx)) {
1035*4882a593Smuzhiyun kdamond_merge_regions(ctx,
1036*4882a593Smuzhiyun max_nr_accesses / 10,
1037*4882a593Smuzhiyun sz_limit);
1038*4882a593Smuzhiyun if (ctx->callback.after_aggregation &&
1039*4882a593Smuzhiyun ctx->callback.after_aggregation(ctx))
1040*4882a593Smuzhiyun done = true;
1041*4882a593Smuzhiyun kdamond_apply_schemes(ctx);
1042*4882a593Smuzhiyun kdamond_reset_aggregated(ctx);
1043*4882a593Smuzhiyun kdamond_split_regions(ctx);
1044*4882a593Smuzhiyun if (ctx->primitive.reset_aggregated)
1045*4882a593Smuzhiyun ctx->primitive.reset_aggregated(ctx);
1046*4882a593Smuzhiyun }
1047*4882a593Smuzhiyun
1048*4882a593Smuzhiyun if (kdamond_need_update_primitive(ctx)) {
1049*4882a593Smuzhiyun if (ctx->primitive.update)
1050*4882a593Smuzhiyun ctx->primitive.update(ctx);
1051*4882a593Smuzhiyun sz_limit = damon_region_sz_limit(ctx);
1052*4882a593Smuzhiyun }
1053*4882a593Smuzhiyun }
1054*4882a593Smuzhiyun damon_for_each_target(t, ctx) {
1055*4882a593Smuzhiyun damon_for_each_region_safe(r, next, t)
1056*4882a593Smuzhiyun damon_destroy_region(r, t);
1057*4882a593Smuzhiyun }
1058*4882a593Smuzhiyun
1059*4882a593Smuzhiyun if (ctx->callback.before_terminate)
1060*4882a593Smuzhiyun ctx->callback.before_terminate(ctx);
1061*4882a593Smuzhiyun if (ctx->primitive.cleanup)
1062*4882a593Smuzhiyun ctx->primitive.cleanup(ctx);
1063*4882a593Smuzhiyun
1064*4882a593Smuzhiyun pr_debug("kdamond (%d) finishes\n", current->pid);
1065*4882a593Smuzhiyun mutex_lock(&ctx->kdamond_lock);
1066*4882a593Smuzhiyun ctx->kdamond = NULL;
1067*4882a593Smuzhiyun mutex_unlock(&ctx->kdamond_lock);
1068*4882a593Smuzhiyun
1069*4882a593Smuzhiyun mutex_lock(&damon_lock);
1070*4882a593Smuzhiyun nr_running_ctxs--;
1071*4882a593Smuzhiyun mutex_unlock(&damon_lock);
1072*4882a593Smuzhiyun
1073*4882a593Smuzhiyun return 0;
1074*4882a593Smuzhiyun }
1075*4882a593Smuzhiyun
1076*4882a593Smuzhiyun #include "core-test.h"
1077