xref: /OK3568_Linux_fs/kernel/drivers/rknpu/rknpu_mm.c (revision 4882a59341e53eb6f0b4789bf948001014eff981)
1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun  * Copyright (C) Rockchip Electronics Co.Ltd
4*4882a593Smuzhiyun  * Author: Felix Zeng <felix.zeng@rock-chips.com>
5*4882a593Smuzhiyun  */
6*4882a593Smuzhiyun 
7*4882a593Smuzhiyun #include "rknpu_debugger.h"
8*4882a593Smuzhiyun #include "rknpu_mm.h"
9*4882a593Smuzhiyun 
rknpu_mm_create(unsigned int mem_size,unsigned int chunk_size,struct rknpu_mm ** mm)10*4882a593Smuzhiyun int rknpu_mm_create(unsigned int mem_size, unsigned int chunk_size,
11*4882a593Smuzhiyun 		    struct rknpu_mm **mm)
12*4882a593Smuzhiyun {
13*4882a593Smuzhiyun 	unsigned int num_of_longs;
14*4882a593Smuzhiyun 	int ret = -EINVAL;
15*4882a593Smuzhiyun 
16*4882a593Smuzhiyun 	if (WARN_ON(mem_size < chunk_size))
17*4882a593Smuzhiyun 		return -EINVAL;
18*4882a593Smuzhiyun 	if (WARN_ON(mem_size == 0))
19*4882a593Smuzhiyun 		return -EINVAL;
20*4882a593Smuzhiyun 	if (WARN_ON(chunk_size == 0))
21*4882a593Smuzhiyun 		return -EINVAL;
22*4882a593Smuzhiyun 
23*4882a593Smuzhiyun 	*mm = kzalloc(sizeof(struct rknpu_mm), GFP_KERNEL);
24*4882a593Smuzhiyun 	if (!(*mm))
25*4882a593Smuzhiyun 		return -ENOMEM;
26*4882a593Smuzhiyun 
27*4882a593Smuzhiyun 	(*mm)->chunk_size = chunk_size;
28*4882a593Smuzhiyun 	(*mm)->total_chunks = mem_size / chunk_size;
29*4882a593Smuzhiyun 	(*mm)->free_chunks = (*mm)->total_chunks;
30*4882a593Smuzhiyun 
31*4882a593Smuzhiyun 	num_of_longs =
32*4882a593Smuzhiyun 		((*mm)->total_chunks + BITS_PER_LONG - 1) / BITS_PER_LONG;
33*4882a593Smuzhiyun 
34*4882a593Smuzhiyun 	(*mm)->bitmap = kcalloc(num_of_longs, sizeof(long), GFP_KERNEL);
35*4882a593Smuzhiyun 	if (!(*mm)->bitmap) {
36*4882a593Smuzhiyun 		ret = -ENOMEM;
37*4882a593Smuzhiyun 		goto free_mm;
38*4882a593Smuzhiyun 	}
39*4882a593Smuzhiyun 
40*4882a593Smuzhiyun 	mutex_init(&(*mm)->lock);
41*4882a593Smuzhiyun 
42*4882a593Smuzhiyun 	LOG_DEBUG("total_chunks: %d, bitmap: %p\n", (*mm)->total_chunks,
43*4882a593Smuzhiyun 		  (*mm)->bitmap);
44*4882a593Smuzhiyun 
45*4882a593Smuzhiyun 	return 0;
46*4882a593Smuzhiyun 
47*4882a593Smuzhiyun free_mm:
48*4882a593Smuzhiyun 	kfree(mm);
49*4882a593Smuzhiyun 	return ret;
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun 
rknpu_mm_destroy(struct rknpu_mm * mm)52*4882a593Smuzhiyun void rknpu_mm_destroy(struct rknpu_mm *mm)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun 	if (mm != NULL) {
55*4882a593Smuzhiyun 		mutex_destroy(&mm->lock);
56*4882a593Smuzhiyun 		kfree(mm->bitmap);
57*4882a593Smuzhiyun 		kfree(mm);
58*4882a593Smuzhiyun 	}
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun 
rknpu_mm_alloc(struct rknpu_mm * mm,unsigned int size,struct rknpu_mm_obj ** mm_obj)61*4882a593Smuzhiyun int rknpu_mm_alloc(struct rknpu_mm *mm, unsigned int size,
62*4882a593Smuzhiyun 		   struct rknpu_mm_obj **mm_obj)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun 	unsigned int found, start_search, cur_size;
65*4882a593Smuzhiyun 
66*4882a593Smuzhiyun 	if (size == 0)
67*4882a593Smuzhiyun 		return -EINVAL;
68*4882a593Smuzhiyun 
69*4882a593Smuzhiyun 	if (size > mm->total_chunks * mm->chunk_size)
70*4882a593Smuzhiyun 		return -ENOMEM;
71*4882a593Smuzhiyun 
72*4882a593Smuzhiyun 	*mm_obj = kzalloc(sizeof(struct rknpu_mm_obj), GFP_KERNEL);
73*4882a593Smuzhiyun 	if (!(*mm_obj))
74*4882a593Smuzhiyun 		return -ENOMEM;
75*4882a593Smuzhiyun 
76*4882a593Smuzhiyun 	start_search = 0;
77*4882a593Smuzhiyun 
78*4882a593Smuzhiyun 	mutex_lock(&mm->lock);
79*4882a593Smuzhiyun 
80*4882a593Smuzhiyun mm_restart_search:
81*4882a593Smuzhiyun 	/* Find the first chunk that is free */
82*4882a593Smuzhiyun 	found = find_next_zero_bit(mm->bitmap, mm->total_chunks, start_search);
83*4882a593Smuzhiyun 
84*4882a593Smuzhiyun 	/* If there wasn't any free chunk, bail out */
85*4882a593Smuzhiyun 	if (found == mm->total_chunks)
86*4882a593Smuzhiyun 		goto mm_no_free_chunk;
87*4882a593Smuzhiyun 
88*4882a593Smuzhiyun 	/* Update fields of mm_obj */
89*4882a593Smuzhiyun 	(*mm_obj)->range_start = found;
90*4882a593Smuzhiyun 	(*mm_obj)->range_end = found;
91*4882a593Smuzhiyun 
92*4882a593Smuzhiyun 	/* If we need only one chunk, mark it as allocated and get out */
93*4882a593Smuzhiyun 	if (size <= mm->chunk_size) {
94*4882a593Smuzhiyun 		set_bit(found, mm->bitmap);
95*4882a593Smuzhiyun 		goto mm_out;
96*4882a593Smuzhiyun 	}
97*4882a593Smuzhiyun 
98*4882a593Smuzhiyun 	/* Otherwise, try to see if we have enough contiguous chunks */
99*4882a593Smuzhiyun 	cur_size = size - mm->chunk_size;
100*4882a593Smuzhiyun 	do {
101*4882a593Smuzhiyun 		(*mm_obj)->range_end = find_next_zero_bit(
102*4882a593Smuzhiyun 			mm->bitmap, mm->total_chunks, ++found);
103*4882a593Smuzhiyun 		/*
104*4882a593Smuzhiyun 		 * If next free chunk is not contiguous than we need to
105*4882a593Smuzhiyun 		 * restart our search from the last free chunk we found (which
106*4882a593Smuzhiyun 		 * wasn't contiguous to the previous ones
107*4882a593Smuzhiyun 		 */
108*4882a593Smuzhiyun 		if ((*mm_obj)->range_end != found) {
109*4882a593Smuzhiyun 			start_search = found;
110*4882a593Smuzhiyun 			goto mm_restart_search;
111*4882a593Smuzhiyun 		}
112*4882a593Smuzhiyun 
113*4882a593Smuzhiyun 		/*
114*4882a593Smuzhiyun 		 * If we reached end of buffer, bail out with error
115*4882a593Smuzhiyun 		 */
116*4882a593Smuzhiyun 		if (found == mm->total_chunks)
117*4882a593Smuzhiyun 			goto mm_no_free_chunk;
118*4882a593Smuzhiyun 
119*4882a593Smuzhiyun 		/* Check if we don't need another chunk */
120*4882a593Smuzhiyun 		if (cur_size <= mm->chunk_size)
121*4882a593Smuzhiyun 			cur_size = 0;
122*4882a593Smuzhiyun 		else
123*4882a593Smuzhiyun 			cur_size -= mm->chunk_size;
124*4882a593Smuzhiyun 
125*4882a593Smuzhiyun 	} while (cur_size > 0);
126*4882a593Smuzhiyun 
127*4882a593Smuzhiyun 	/* Mark the chunks as allocated */
128*4882a593Smuzhiyun 	for (found = (*mm_obj)->range_start; found <= (*mm_obj)->range_end;
129*4882a593Smuzhiyun 	     found++)
130*4882a593Smuzhiyun 		set_bit(found, mm->bitmap);
131*4882a593Smuzhiyun 
132*4882a593Smuzhiyun mm_out:
133*4882a593Smuzhiyun 	mm->free_chunks -= ((*mm_obj)->range_end - (*mm_obj)->range_start + 1);
134*4882a593Smuzhiyun 	mutex_unlock(&mm->lock);
135*4882a593Smuzhiyun 
136*4882a593Smuzhiyun 	LOG_DEBUG("mm allocate, mm_obj: %p, range_start: %d, range_end: %d\n",
137*4882a593Smuzhiyun 		  *mm_obj, (*mm_obj)->range_start, (*mm_obj)->range_end);
138*4882a593Smuzhiyun 
139*4882a593Smuzhiyun 	return 0;
140*4882a593Smuzhiyun 
141*4882a593Smuzhiyun mm_no_free_chunk:
142*4882a593Smuzhiyun 	mutex_unlock(&mm->lock);
143*4882a593Smuzhiyun 	kfree(*mm_obj);
144*4882a593Smuzhiyun 
145*4882a593Smuzhiyun 	return -ENOMEM;
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun 
rknpu_mm_free(struct rknpu_mm * mm,struct rknpu_mm_obj * mm_obj)148*4882a593Smuzhiyun int rknpu_mm_free(struct rknpu_mm *mm, struct rknpu_mm_obj *mm_obj)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun 	unsigned int bit;
151*4882a593Smuzhiyun 
152*4882a593Smuzhiyun 	/* Act like kfree when trying to free a NULL object */
153*4882a593Smuzhiyun 	if (!mm_obj)
154*4882a593Smuzhiyun 		return 0;
155*4882a593Smuzhiyun 
156*4882a593Smuzhiyun 	LOG_DEBUG("mm free, mem_obj: %p, range_start: %d, range_end: %d\n",
157*4882a593Smuzhiyun 		  mm_obj, mm_obj->range_start, mm_obj->range_end);
158*4882a593Smuzhiyun 
159*4882a593Smuzhiyun 	mutex_lock(&mm->lock);
160*4882a593Smuzhiyun 
161*4882a593Smuzhiyun 	/* Mark the chunks as free */
162*4882a593Smuzhiyun 	for (bit = mm_obj->range_start; bit <= mm_obj->range_end; bit++)
163*4882a593Smuzhiyun 		clear_bit(bit, mm->bitmap);
164*4882a593Smuzhiyun 
165*4882a593Smuzhiyun 	mm->free_chunks += (mm_obj->range_end - mm_obj->range_start + 1);
166*4882a593Smuzhiyun 
167*4882a593Smuzhiyun 	mutex_unlock(&mm->lock);
168*4882a593Smuzhiyun 
169*4882a593Smuzhiyun 	kfree(mm_obj);
170*4882a593Smuzhiyun 
171*4882a593Smuzhiyun 	return 0;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun 
rknpu_mm_dump(struct seq_file * m,void * data)174*4882a593Smuzhiyun int rknpu_mm_dump(struct seq_file *m, void *data)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun 	struct rknpu_debugger_node *node = m->private;
177*4882a593Smuzhiyun 	struct rknpu_debugger *debugger = node->debugger;
178*4882a593Smuzhiyun 	struct rknpu_device *rknpu_dev =
179*4882a593Smuzhiyun 		container_of(debugger, struct rknpu_device, debugger);
180*4882a593Smuzhiyun 	struct rknpu_mm *mm = NULL;
181*4882a593Smuzhiyun 	int cur = 0, rbot = 0, rtop = 0;
182*4882a593Smuzhiyun 	size_t ret = 0;
183*4882a593Smuzhiyun 	char buf[64];
184*4882a593Smuzhiyun 	size_t size = sizeof(buf);
185*4882a593Smuzhiyun 	int seg_chunks = 32, seg_id = 0;
186*4882a593Smuzhiyun 	int free_size = 0;
187*4882a593Smuzhiyun 	int i = 0;
188*4882a593Smuzhiyun 
189*4882a593Smuzhiyun 	mm = rknpu_dev->sram_mm;
190*4882a593Smuzhiyun 	if (mm == NULL)
191*4882a593Smuzhiyun 		return 0;
192*4882a593Smuzhiyun 
193*4882a593Smuzhiyun 	seq_printf(m, "SRAM bitmap: \"*\" - used, \".\" - free (1bit = %dKB)\n",
194*4882a593Smuzhiyun 		   mm->chunk_size / 1024);
195*4882a593Smuzhiyun 
196*4882a593Smuzhiyun 	rbot = cur = find_first_bit(mm->bitmap, mm->total_chunks);
197*4882a593Smuzhiyun 	for (i = 0; i < cur; ++i) {
198*4882a593Smuzhiyun 		ret += scnprintf(buf + ret, size - ret, ".");
199*4882a593Smuzhiyun 		if (ret >= seg_chunks) {
200*4882a593Smuzhiyun 			seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
201*4882a593Smuzhiyun 			ret = 0;
202*4882a593Smuzhiyun 		}
203*4882a593Smuzhiyun 	}
204*4882a593Smuzhiyun 	while (cur < mm->total_chunks) {
205*4882a593Smuzhiyun 		rtop = cur;
206*4882a593Smuzhiyun 		cur = find_next_bit(mm->bitmap, mm->total_chunks, cur + 1);
207*4882a593Smuzhiyun 		if (cur < mm->total_chunks && cur <= rtop + 1)
208*4882a593Smuzhiyun 			continue;
209*4882a593Smuzhiyun 
210*4882a593Smuzhiyun 		for (i = rbot; i <= rtop; ++i) {
211*4882a593Smuzhiyun 			ret += scnprintf(buf + ret, size - ret, "*");
212*4882a593Smuzhiyun 			if (ret >= seg_chunks) {
213*4882a593Smuzhiyun 				seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
214*4882a593Smuzhiyun 				ret = 0;
215*4882a593Smuzhiyun 			}
216*4882a593Smuzhiyun 		}
217*4882a593Smuzhiyun 
218*4882a593Smuzhiyun 		for (i = rtop + 1; i < cur; ++i) {
219*4882a593Smuzhiyun 			ret += scnprintf(buf + ret, size - ret, ".");
220*4882a593Smuzhiyun 			if (ret >= seg_chunks) {
221*4882a593Smuzhiyun 				seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
222*4882a593Smuzhiyun 				ret = 0;
223*4882a593Smuzhiyun 			}
224*4882a593Smuzhiyun 		}
225*4882a593Smuzhiyun 
226*4882a593Smuzhiyun 		rbot = cur;
227*4882a593Smuzhiyun 	}
228*4882a593Smuzhiyun 
229*4882a593Smuzhiyun 	if (ret > 0)
230*4882a593Smuzhiyun 		seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
231*4882a593Smuzhiyun 
232*4882a593Smuzhiyun 	free_size = mm->free_chunks * mm->chunk_size;
233*4882a593Smuzhiyun 	seq_printf(m, "SRAM total size: %d, used: %d, free: %d\n",
234*4882a593Smuzhiyun 		   rknpu_dev->sram_size, rknpu_dev->sram_size - free_size,
235*4882a593Smuzhiyun 		   free_size);
236*4882a593Smuzhiyun 
237*4882a593Smuzhiyun 	return 0;
238*4882a593Smuzhiyun }
239