1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) Rockchip Electronics Co.Ltd
4*4882a593Smuzhiyun * Author: Felix Zeng <felix.zeng@rock-chips.com>
5*4882a593Smuzhiyun */
6*4882a593Smuzhiyun
7*4882a593Smuzhiyun #include "rknpu_debugger.h"
8*4882a593Smuzhiyun #include "rknpu_mm.h"
9*4882a593Smuzhiyun
rknpu_mm_create(unsigned int mem_size,unsigned int chunk_size,struct rknpu_mm ** mm)10*4882a593Smuzhiyun int rknpu_mm_create(unsigned int mem_size, unsigned int chunk_size,
11*4882a593Smuzhiyun struct rknpu_mm **mm)
12*4882a593Smuzhiyun {
13*4882a593Smuzhiyun unsigned int num_of_longs;
14*4882a593Smuzhiyun int ret = -EINVAL;
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun if (WARN_ON(mem_size < chunk_size))
17*4882a593Smuzhiyun return -EINVAL;
18*4882a593Smuzhiyun if (WARN_ON(mem_size == 0))
19*4882a593Smuzhiyun return -EINVAL;
20*4882a593Smuzhiyun if (WARN_ON(chunk_size == 0))
21*4882a593Smuzhiyun return -EINVAL;
22*4882a593Smuzhiyun
23*4882a593Smuzhiyun *mm = kzalloc(sizeof(struct rknpu_mm), GFP_KERNEL);
24*4882a593Smuzhiyun if (!(*mm))
25*4882a593Smuzhiyun return -ENOMEM;
26*4882a593Smuzhiyun
27*4882a593Smuzhiyun (*mm)->chunk_size = chunk_size;
28*4882a593Smuzhiyun (*mm)->total_chunks = mem_size / chunk_size;
29*4882a593Smuzhiyun (*mm)->free_chunks = (*mm)->total_chunks;
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun num_of_longs =
32*4882a593Smuzhiyun ((*mm)->total_chunks + BITS_PER_LONG - 1) / BITS_PER_LONG;
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun (*mm)->bitmap = kcalloc(num_of_longs, sizeof(long), GFP_KERNEL);
35*4882a593Smuzhiyun if (!(*mm)->bitmap) {
36*4882a593Smuzhiyun ret = -ENOMEM;
37*4882a593Smuzhiyun goto free_mm;
38*4882a593Smuzhiyun }
39*4882a593Smuzhiyun
40*4882a593Smuzhiyun mutex_init(&(*mm)->lock);
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun LOG_DEBUG("total_chunks: %d, bitmap: %p\n", (*mm)->total_chunks,
43*4882a593Smuzhiyun (*mm)->bitmap);
44*4882a593Smuzhiyun
45*4882a593Smuzhiyun return 0;
46*4882a593Smuzhiyun
47*4882a593Smuzhiyun free_mm:
48*4882a593Smuzhiyun kfree(mm);
49*4882a593Smuzhiyun return ret;
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
rknpu_mm_destroy(struct rknpu_mm * mm)52*4882a593Smuzhiyun void rknpu_mm_destroy(struct rknpu_mm *mm)
53*4882a593Smuzhiyun {
54*4882a593Smuzhiyun if (mm != NULL) {
55*4882a593Smuzhiyun mutex_destroy(&mm->lock);
56*4882a593Smuzhiyun kfree(mm->bitmap);
57*4882a593Smuzhiyun kfree(mm);
58*4882a593Smuzhiyun }
59*4882a593Smuzhiyun }
60*4882a593Smuzhiyun
rknpu_mm_alloc(struct rknpu_mm * mm,unsigned int size,struct rknpu_mm_obj ** mm_obj)61*4882a593Smuzhiyun int rknpu_mm_alloc(struct rknpu_mm *mm, unsigned int size,
62*4882a593Smuzhiyun struct rknpu_mm_obj **mm_obj)
63*4882a593Smuzhiyun {
64*4882a593Smuzhiyun unsigned int found, start_search, cur_size;
65*4882a593Smuzhiyun
66*4882a593Smuzhiyun if (size == 0)
67*4882a593Smuzhiyun return -EINVAL;
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun if (size > mm->total_chunks * mm->chunk_size)
70*4882a593Smuzhiyun return -ENOMEM;
71*4882a593Smuzhiyun
72*4882a593Smuzhiyun *mm_obj = kzalloc(sizeof(struct rknpu_mm_obj), GFP_KERNEL);
73*4882a593Smuzhiyun if (!(*mm_obj))
74*4882a593Smuzhiyun return -ENOMEM;
75*4882a593Smuzhiyun
76*4882a593Smuzhiyun start_search = 0;
77*4882a593Smuzhiyun
78*4882a593Smuzhiyun mutex_lock(&mm->lock);
79*4882a593Smuzhiyun
80*4882a593Smuzhiyun mm_restart_search:
81*4882a593Smuzhiyun /* Find the first chunk that is free */
82*4882a593Smuzhiyun found = find_next_zero_bit(mm->bitmap, mm->total_chunks, start_search);
83*4882a593Smuzhiyun
84*4882a593Smuzhiyun /* If there wasn't any free chunk, bail out */
85*4882a593Smuzhiyun if (found == mm->total_chunks)
86*4882a593Smuzhiyun goto mm_no_free_chunk;
87*4882a593Smuzhiyun
88*4882a593Smuzhiyun /* Update fields of mm_obj */
89*4882a593Smuzhiyun (*mm_obj)->range_start = found;
90*4882a593Smuzhiyun (*mm_obj)->range_end = found;
91*4882a593Smuzhiyun
92*4882a593Smuzhiyun /* If we need only one chunk, mark it as allocated and get out */
93*4882a593Smuzhiyun if (size <= mm->chunk_size) {
94*4882a593Smuzhiyun set_bit(found, mm->bitmap);
95*4882a593Smuzhiyun goto mm_out;
96*4882a593Smuzhiyun }
97*4882a593Smuzhiyun
98*4882a593Smuzhiyun /* Otherwise, try to see if we have enough contiguous chunks */
99*4882a593Smuzhiyun cur_size = size - mm->chunk_size;
100*4882a593Smuzhiyun do {
101*4882a593Smuzhiyun (*mm_obj)->range_end = find_next_zero_bit(
102*4882a593Smuzhiyun mm->bitmap, mm->total_chunks, ++found);
103*4882a593Smuzhiyun /*
104*4882a593Smuzhiyun * If next free chunk is not contiguous than we need to
105*4882a593Smuzhiyun * restart our search from the last free chunk we found (which
106*4882a593Smuzhiyun * wasn't contiguous to the previous ones
107*4882a593Smuzhiyun */
108*4882a593Smuzhiyun if ((*mm_obj)->range_end != found) {
109*4882a593Smuzhiyun start_search = found;
110*4882a593Smuzhiyun goto mm_restart_search;
111*4882a593Smuzhiyun }
112*4882a593Smuzhiyun
113*4882a593Smuzhiyun /*
114*4882a593Smuzhiyun * If we reached end of buffer, bail out with error
115*4882a593Smuzhiyun */
116*4882a593Smuzhiyun if (found == mm->total_chunks)
117*4882a593Smuzhiyun goto mm_no_free_chunk;
118*4882a593Smuzhiyun
119*4882a593Smuzhiyun /* Check if we don't need another chunk */
120*4882a593Smuzhiyun if (cur_size <= mm->chunk_size)
121*4882a593Smuzhiyun cur_size = 0;
122*4882a593Smuzhiyun else
123*4882a593Smuzhiyun cur_size -= mm->chunk_size;
124*4882a593Smuzhiyun
125*4882a593Smuzhiyun } while (cur_size > 0);
126*4882a593Smuzhiyun
127*4882a593Smuzhiyun /* Mark the chunks as allocated */
128*4882a593Smuzhiyun for (found = (*mm_obj)->range_start; found <= (*mm_obj)->range_end;
129*4882a593Smuzhiyun found++)
130*4882a593Smuzhiyun set_bit(found, mm->bitmap);
131*4882a593Smuzhiyun
132*4882a593Smuzhiyun mm_out:
133*4882a593Smuzhiyun mm->free_chunks -= ((*mm_obj)->range_end - (*mm_obj)->range_start + 1);
134*4882a593Smuzhiyun mutex_unlock(&mm->lock);
135*4882a593Smuzhiyun
136*4882a593Smuzhiyun LOG_DEBUG("mm allocate, mm_obj: %p, range_start: %d, range_end: %d\n",
137*4882a593Smuzhiyun *mm_obj, (*mm_obj)->range_start, (*mm_obj)->range_end);
138*4882a593Smuzhiyun
139*4882a593Smuzhiyun return 0;
140*4882a593Smuzhiyun
141*4882a593Smuzhiyun mm_no_free_chunk:
142*4882a593Smuzhiyun mutex_unlock(&mm->lock);
143*4882a593Smuzhiyun kfree(*mm_obj);
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun return -ENOMEM;
146*4882a593Smuzhiyun }
147*4882a593Smuzhiyun
rknpu_mm_free(struct rknpu_mm * mm,struct rknpu_mm_obj * mm_obj)148*4882a593Smuzhiyun int rknpu_mm_free(struct rknpu_mm *mm, struct rknpu_mm_obj *mm_obj)
149*4882a593Smuzhiyun {
150*4882a593Smuzhiyun unsigned int bit;
151*4882a593Smuzhiyun
152*4882a593Smuzhiyun /* Act like kfree when trying to free a NULL object */
153*4882a593Smuzhiyun if (!mm_obj)
154*4882a593Smuzhiyun return 0;
155*4882a593Smuzhiyun
156*4882a593Smuzhiyun LOG_DEBUG("mm free, mem_obj: %p, range_start: %d, range_end: %d\n",
157*4882a593Smuzhiyun mm_obj, mm_obj->range_start, mm_obj->range_end);
158*4882a593Smuzhiyun
159*4882a593Smuzhiyun mutex_lock(&mm->lock);
160*4882a593Smuzhiyun
161*4882a593Smuzhiyun /* Mark the chunks as free */
162*4882a593Smuzhiyun for (bit = mm_obj->range_start; bit <= mm_obj->range_end; bit++)
163*4882a593Smuzhiyun clear_bit(bit, mm->bitmap);
164*4882a593Smuzhiyun
165*4882a593Smuzhiyun mm->free_chunks += (mm_obj->range_end - mm_obj->range_start + 1);
166*4882a593Smuzhiyun
167*4882a593Smuzhiyun mutex_unlock(&mm->lock);
168*4882a593Smuzhiyun
169*4882a593Smuzhiyun kfree(mm_obj);
170*4882a593Smuzhiyun
171*4882a593Smuzhiyun return 0;
172*4882a593Smuzhiyun }
173*4882a593Smuzhiyun
rknpu_mm_dump(struct seq_file * m,void * data)174*4882a593Smuzhiyun int rknpu_mm_dump(struct seq_file *m, void *data)
175*4882a593Smuzhiyun {
176*4882a593Smuzhiyun struct rknpu_debugger_node *node = m->private;
177*4882a593Smuzhiyun struct rknpu_debugger *debugger = node->debugger;
178*4882a593Smuzhiyun struct rknpu_device *rknpu_dev =
179*4882a593Smuzhiyun container_of(debugger, struct rknpu_device, debugger);
180*4882a593Smuzhiyun struct rknpu_mm *mm = NULL;
181*4882a593Smuzhiyun int cur = 0, rbot = 0, rtop = 0;
182*4882a593Smuzhiyun size_t ret = 0;
183*4882a593Smuzhiyun char buf[64];
184*4882a593Smuzhiyun size_t size = sizeof(buf);
185*4882a593Smuzhiyun int seg_chunks = 32, seg_id = 0;
186*4882a593Smuzhiyun int free_size = 0;
187*4882a593Smuzhiyun int i = 0;
188*4882a593Smuzhiyun
189*4882a593Smuzhiyun mm = rknpu_dev->sram_mm;
190*4882a593Smuzhiyun if (mm == NULL)
191*4882a593Smuzhiyun return 0;
192*4882a593Smuzhiyun
193*4882a593Smuzhiyun seq_printf(m, "SRAM bitmap: \"*\" - used, \".\" - free (1bit = %dKB)\n",
194*4882a593Smuzhiyun mm->chunk_size / 1024);
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun rbot = cur = find_first_bit(mm->bitmap, mm->total_chunks);
197*4882a593Smuzhiyun for (i = 0; i < cur; ++i) {
198*4882a593Smuzhiyun ret += scnprintf(buf + ret, size - ret, ".");
199*4882a593Smuzhiyun if (ret >= seg_chunks) {
200*4882a593Smuzhiyun seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
201*4882a593Smuzhiyun ret = 0;
202*4882a593Smuzhiyun }
203*4882a593Smuzhiyun }
204*4882a593Smuzhiyun while (cur < mm->total_chunks) {
205*4882a593Smuzhiyun rtop = cur;
206*4882a593Smuzhiyun cur = find_next_bit(mm->bitmap, mm->total_chunks, cur + 1);
207*4882a593Smuzhiyun if (cur < mm->total_chunks && cur <= rtop + 1)
208*4882a593Smuzhiyun continue;
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun for (i = rbot; i <= rtop; ++i) {
211*4882a593Smuzhiyun ret += scnprintf(buf + ret, size - ret, "*");
212*4882a593Smuzhiyun if (ret >= seg_chunks) {
213*4882a593Smuzhiyun seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
214*4882a593Smuzhiyun ret = 0;
215*4882a593Smuzhiyun }
216*4882a593Smuzhiyun }
217*4882a593Smuzhiyun
218*4882a593Smuzhiyun for (i = rtop + 1; i < cur; ++i) {
219*4882a593Smuzhiyun ret += scnprintf(buf + ret, size - ret, ".");
220*4882a593Smuzhiyun if (ret >= seg_chunks) {
221*4882a593Smuzhiyun seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
222*4882a593Smuzhiyun ret = 0;
223*4882a593Smuzhiyun }
224*4882a593Smuzhiyun }
225*4882a593Smuzhiyun
226*4882a593Smuzhiyun rbot = cur;
227*4882a593Smuzhiyun }
228*4882a593Smuzhiyun
229*4882a593Smuzhiyun if (ret > 0)
230*4882a593Smuzhiyun seq_printf(m, "[%03d] [%s]\n", seg_id++, buf);
231*4882a593Smuzhiyun
232*4882a593Smuzhiyun free_size = mm->free_chunks * mm->chunk_size;
233*4882a593Smuzhiyun seq_printf(m, "SRAM total size: %d, used: %d, free: %d\n",
234*4882a593Smuzhiyun rknpu_dev->sram_size, rknpu_dev->sram_size - free_size,
235*4882a593Smuzhiyun free_size);
236*4882a593Smuzhiyun
237*4882a593Smuzhiyun return 0;
238*4882a593Smuzhiyun }
239