1*4882a593Smuzhiyun /* SPDX-License-Identifier: GPL-2.0-or-later */
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Copyright (C) International Business Machines Corp., 2000-2002
4*4882a593Smuzhiyun */
5*4882a593Smuzhiyun #ifndef _H_JFS_DMAP
6*4882a593Smuzhiyun #define _H_JFS_DMAP
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include "jfs_txnmgr.h"
9*4882a593Smuzhiyun
/*
 * Fixed geometry of the block allocation map.  An "L2" prefix marks the
 * log2 of the like-named quantity.
 */
#define BMAPVERSION	1	/* version number of the map format */

/* summary tree stored in every dmap page */
#define TREESIZE	(256+64+16+4+1)	/* nodes in a dmap tree, all levels */
#define LEAFIND		(64+16+4+1)	/* index of a dmap tree's first leaf */
#define LPERDMAP	256	/* leaves in a dmap tree */
#define L2LPERDMAP	8	/* l2 of LPERDMAP */

/* bitmap words */
#define DBWORD		32	/* blocks described by one map word */
#define L2DBWORD	5	/* l2 of DBWORD */
#define BUDMIN		L2DBWORD	/* max free string in a map word */
#define BPERDMAP	(LPERDMAP * DBWORD)	/* blocks described by one dmap */
#define L2BPERDMAP	13	/* l2 of BPERDMAP */

/* summary tree stored in every dmapctl page */
#define CTLTREESIZE	(1024+256+64+16+4+1)	/* nodes in a dmapctl tree */
#define CTLLEAFIND	(256+64+16+4+1)	/* index of a dmapctl tree's first leaf */
#define LPERCTL		1024	/* leaves in a dmapctl tree */
#define L2LPERCTL	10	/* l2 of LPERCTL */

/* conventions shared by both kinds of tree */
#define ROOT		0	/* index of the root of a tree */
#define NOFREE		((s8) -1)	/* tree value meaning "no blocks free" */

/* allocation groups (AG) */
#define MAXAG		128	/* max number of allocation groups */
#define L2MAXAG		7	/* l2 of MAXAG */
#define L2MINAGSZ	25	/* l2 of minimum AG size in bytes */

#define BMAPBLKNO	0	/* lblkno of bmap within the map */
30*4882a593Smuzhiyun
/*
 * l2 of the largest number of disk blocks that can sit below one dmapctl
 * page at level 0, 1 and 2: each level multiplies the reach of the level
 * below it by LPERCTL, starting from the BPERDMAP blocks of a single dmap.
 */
#define L2MAXL0SIZE	(L2BPERDMAP + 1 * L2LPERCTL)
#define L2MAXL1SIZE	(L2BPERDMAP + 2 * L2LPERCTL)
#define L2MAXL2SIZE	(L2BPERDMAP + 3 * L2LPERCTL)

/*
 * The same three limits as block counts.  The shift is done on an s64
 * because the larger values do not fit in 32 bits.
 */
#define MAXL0SIZE	((s64)1 << L2MAXL0SIZE)
#define MAXL1SIZE	((s64)1 << L2MAXL1SIZE)
#define MAXL2SIZE	((s64)1 << L2MAXL2SIZE)

#define MAXMAPSIZE	MAXL2SIZE	/* maximum aggregate map size */
46*4882a593Smuzhiyun
/*
 * TREEMAX - maximum free string among four (lower level) nodes of the tree
 * @cp: first of four adjacent tree values; cp[0] through cp[3] are read
 *
 * Returns the largest of the four values.  The comparison is signed, so a
 * negative entry such as NOFREE never wins over a non-negative one.
 * The array is only read, hence the const qualifier.
 */
static inline signed char TREEMAX(const signed char *cp)
{
	signed char best = cp[0];
	int i;

	for (i = 1; i < 4; i++) {
		if (cp[i] > best)
			best = cp[i];
	}

	return best;
}
60*4882a593Smuzhiyun
/*
 * convert disk block number to the logical block number of the dmap
 * describing the disk block.  s is the log2(number of logical blocks per page)
 *
 * The result is the count of map pages that precede the dmap, scaled to
 * logical blocks by s:
 *	(b) >> L2BPERDMAP	dmaps preceding it
 *	(b) >> L2MAXL0SIZE	L0 pages preceding its L0 page
 *	(b) >> L2MAXL1SIZE	L1 pages preceding its L1 page
 *	+ 3			the L2, L1 and L0 page for this dmap
 *	+ 1			the control page of the map
 *
 * The shift counts are the named l2 sizes defined earlier in this header
 * (13, 23 and 33) rather than repeated literals.
 */
#define BLKTODMAP(b,s)	\
	((((b) >> L2BPERDMAP) + ((b) >> L2MAXL0SIZE) + \
	  ((b) >> L2MAXL1SIZE) + 3 + 1) << (s))
74*4882a593Smuzhiyun
/*
 * convert disk block number to the logical block number of the LEVEL 0
 * dmapctl describing the disk block.  s is the log2(number of logical blocks
 * per page)
 *
 * The result is the count of map pages that precede the L0 page, scaled to
 * logical blocks by s:
 *	((b) >> L2MAXL0SIZE) << L2LPERCTL	dmap pages preceding it
 *	(b) >> L2MAXL0SIZE			L0 pages preceding it
 *	(b) >> L2MAXL1SIZE			L1 pages preceding its L1 page
 *	+ 2					the L2 and L1 page for this L0
 *	+ 1					the control page of the map
 *
 * The shift counts are the named l2 sizes defined earlier in this header
 * (23, 10 and 33) rather than repeated literals.
 */
#define BLKTOL0(b,s)	\
	(((((b) >> L2MAXL0SIZE) << L2LPERCTL) + ((b) >> L2MAXL0SIZE) + \
	  ((b) >> L2MAXL1SIZE) + 2 + 1) << (s))
89*4882a593Smuzhiyun
/*
 * convert disk block number to the logical block number of the LEVEL 1
 * dmapctl describing the disk block.  s is the log2(number of logical blocks
 * per page)
 *
 * The result is the count of map pages that precede the L1 page, scaled to
 * logical blocks by s:
 *	((b) >> L2MAXL1SIZE) << (2 * L2LPERCTL)	dmap pages preceding it
 *	((b) >> L2MAXL1SIZE) << L2LPERCTL	L0 pages preceding it
 *	(b) >> L2MAXL1SIZE			L1 pages preceding it
 *	+ 1					the L2 page
 *	+ 1					the control page of the map
 *
 * The shift counts are the named l2 sizes defined earlier in this header
 * (33, 20 and 10) rather than repeated literals.
 */
#define BLKTOL1(b,s)	\
	(((((b) >> L2MAXL1SIZE) << (2 * L2LPERCTL)) + \
	  (((b) >> L2MAXL1SIZE) << L2LPERCTL) + \
	  ((b) >> L2MAXL1SIZE) + 1 + 1) << (s))
104*4882a593Smuzhiyun
/*
 * convert disk block number to the logical block number of the dmapctl
 * at the specified level which describes the disk block.
 *
 * b is the disk block number, s the log2(number of logical blocks per
 * page) and l the dmapctl level (2, 1, anything else is treated as 0).
 *
 * There is a single L2 page and it is page 1 of the map, right behind the
 * control page, so its logical block number is 1 << s.  It is scaled by s
 * like the L1 and L0 results; for s == 0 this is the plain 1 the macro
 * used to yield.
 */
#define BLKTOCTL(b,s,l)	\
	(((l) == 2) ? (1 << (s)) : \
	 ((l) == 1) ? BLKTOL1((b),(s)) : BLKTOL0((b),(s)))
111*4882a593Smuzhiyun
/*
 * convert aggregate map size to the zero origin dmapctl level of the
 * top dmapctl: 2 when the size exceeds what one L1 page can cover, 1 when
 * it exceeds what one L0 page can cover, 0 otherwise.
 */
#define BMAPSZTOLEV(size)	\
	(((size) > MAXL1SIZE) ? 2 : (((size) > MAXL0SIZE) ? 1 : 0))
118*4882a593Smuzhiyun
/*
 * convert disk block number to allocation group number.
 * sbi must point at an object whose ->bmap carries db_agl2size.
 */
#define BLKTOAG(b,sbi)	((b) >> (sbi)->bmap->db_agl2size)

/*
 * convert allocation group number to starting disk block number.
 * Unlike BLKTOAG this takes an inode and reaches the map through
 * JFS_SBI(ip->i_sb); the AG number is widened to s64 before the shift.
 */
#define AGTOBLK(a,ip)	\
	(((s64)(a)) << JFS_SBI((ip)->i_sb)->bmap->db_agl2size)
128*4882a593Smuzhiyun
129*4882a593Smuzhiyun /*
130*4882a593Smuzhiyun * dmap summary tree
131*4882a593Smuzhiyun *
132*4882a593Smuzhiyun * dmaptree must be consistent with dmapctl.
133*4882a593Smuzhiyun */
134*4882a593Smuzhiyun struct dmaptree {
135*4882a593Smuzhiyun __le32 nleafs; /* 4: number of tree leafs */
136*4882a593Smuzhiyun __le32 l2nleafs; /* 4: l2 number of tree leafs */
137*4882a593Smuzhiyun __le32 leafidx; /* 4: index of first tree leaf */
138*4882a593Smuzhiyun __le32 height; /* 4: height of the tree */
139*4882a593Smuzhiyun s8 budmin; /* 1: min l2 tree leaf value to combine */
140*4882a593Smuzhiyun s8 stree[TREESIZE]; /* TREESIZE: tree */
141*4882a593Smuzhiyun u8 pad[2]; /* 2: pad to word boundary */
142*4882a593Smuzhiyun }; /* - 360 - */
143*4882a593Smuzhiyun
144*4882a593Smuzhiyun /*
145*4882a593Smuzhiyun * dmap page per 8K blocks bitmap
146*4882a593Smuzhiyun */
147*4882a593Smuzhiyun struct dmap {
148*4882a593Smuzhiyun __le32 nblocks; /* 4: num blks covered by this dmap */
149*4882a593Smuzhiyun __le32 nfree; /* 4: num of free blks in this dmap */
150*4882a593Smuzhiyun __le64 start; /* 8: starting blkno for this dmap */
151*4882a593Smuzhiyun struct dmaptree tree; /* 360: dmap tree */
152*4882a593Smuzhiyun u8 pad[1672]; /* 1672: pad to 2048 bytes */
153*4882a593Smuzhiyun __le32 wmap[LPERDMAP]; /* 1024: bits of the working map */
154*4882a593Smuzhiyun __le32 pmap[LPERDMAP]; /* 1024: bits of the persistent map */
155*4882a593Smuzhiyun }; /* - 4096 - */
156*4882a593Smuzhiyun
157*4882a593Smuzhiyun /*
158*4882a593Smuzhiyun * disk map control page per level.
159*4882a593Smuzhiyun *
160*4882a593Smuzhiyun * dmapctl must be consistent with dmaptree.
161*4882a593Smuzhiyun */
162*4882a593Smuzhiyun struct dmapctl {
163*4882a593Smuzhiyun __le32 nleafs; /* 4: number of tree leafs */
164*4882a593Smuzhiyun __le32 l2nleafs; /* 4: l2 number of tree leafs */
165*4882a593Smuzhiyun __le32 leafidx; /* 4: index of the first tree leaf */
166*4882a593Smuzhiyun __le32 height; /* 4: height of tree */
167*4882a593Smuzhiyun s8 budmin; /* 1: minimum l2 tree leaf value */
168*4882a593Smuzhiyun s8 stree[CTLTREESIZE]; /* CTLTREESIZE: dmapctl tree */
169*4882a593Smuzhiyun u8 pad[2714]; /* 2714: pad to 4096 */
170*4882a593Smuzhiyun }; /* - 4096 - */
171*4882a593Smuzhiyun
172*4882a593Smuzhiyun /*
173*4882a593Smuzhiyun * common definition for dmaptree within dmap and dmapctl
174*4882a593Smuzhiyun */
175*4882a593Smuzhiyun typedef union dmtree {
176*4882a593Smuzhiyun struct dmaptree t1;
177*4882a593Smuzhiyun struct dmapctl t2;
178*4882a593Smuzhiyun } dmtree_t;
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun /* macros for accessing fields within dmtree */
181*4882a593Smuzhiyun #define dmt_nleafs t1.nleafs
182*4882a593Smuzhiyun #define dmt_l2nleafs t1.l2nleafs
183*4882a593Smuzhiyun #define dmt_leafidx t1.leafidx
184*4882a593Smuzhiyun #define dmt_height t1.height
185*4882a593Smuzhiyun #define dmt_budmin t1.budmin
186*4882a593Smuzhiyun #define dmt_stree t2.stree
187*4882a593Smuzhiyun
188*4882a593Smuzhiyun /*
189*4882a593Smuzhiyun * on-disk aggregate disk allocation map descriptor.
190*4882a593Smuzhiyun */
191*4882a593Smuzhiyun struct dbmap_disk {
192*4882a593Smuzhiyun __le64 dn_mapsize; /* 8: number of blocks in aggregate */
193*4882a593Smuzhiyun __le64 dn_nfree; /* 8: num free blks in aggregate map */
194*4882a593Smuzhiyun __le32 dn_l2nbperpage; /* 4: number of blks per page */
195*4882a593Smuzhiyun __le32 dn_numag; /* 4: total number of ags */
196*4882a593Smuzhiyun __le32 dn_maxlevel; /* 4: number of active ags */
197*4882a593Smuzhiyun __le32 dn_maxag; /* 4: max active alloc group number */
198*4882a593Smuzhiyun __le32 dn_agpref; /* 4: preferred alloc group (hint) */
199*4882a593Smuzhiyun __le32 dn_aglevel; /* 4: dmapctl level holding the AG */
200*4882a593Smuzhiyun __le32 dn_agheight; /* 4: height in dmapctl of the AG */
201*4882a593Smuzhiyun __le32 dn_agwidth; /* 4: width in dmapctl of the AG */
202*4882a593Smuzhiyun __le32 dn_agstart; /* 4: start tree index at AG height */
203*4882a593Smuzhiyun __le32 dn_agl2size; /* 4: l2 num of blks per alloc group */
204*4882a593Smuzhiyun __le64 dn_agfree[MAXAG];/* 8*MAXAG: per AG free count */
205*4882a593Smuzhiyun __le64 dn_agsize; /* 8: num of blks per alloc group */
206*4882a593Smuzhiyun s8 dn_maxfreebud; /* 1: max free buddy system */
207*4882a593Smuzhiyun u8 pad[3007]; /* 3007: pad to 4096 */
208*4882a593Smuzhiyun }; /* - 4096 - */
209*4882a593Smuzhiyun
210*4882a593Smuzhiyun struct dbmap {
211*4882a593Smuzhiyun s64 dn_mapsize; /* number of blocks in aggregate */
212*4882a593Smuzhiyun s64 dn_nfree; /* num free blks in aggregate map */
213*4882a593Smuzhiyun int dn_l2nbperpage; /* number of blks per page */
214*4882a593Smuzhiyun int dn_numag; /* total number of ags */
215*4882a593Smuzhiyun int dn_maxlevel; /* number of active ags */
216*4882a593Smuzhiyun int dn_maxag; /* max active alloc group number */
217*4882a593Smuzhiyun int dn_agpref; /* preferred alloc group (hint) */
218*4882a593Smuzhiyun int dn_aglevel; /* dmapctl level holding the AG */
219*4882a593Smuzhiyun int dn_agheight; /* height in dmapctl of the AG */
220*4882a593Smuzhiyun int dn_agwidth; /* width in dmapctl of the AG */
221*4882a593Smuzhiyun int dn_agstart; /* start tree index at AG height */
222*4882a593Smuzhiyun int dn_agl2size; /* l2 num of blks per alloc group */
223*4882a593Smuzhiyun s64 dn_agfree[MAXAG]; /* per AG free count */
224*4882a593Smuzhiyun s64 dn_agsize; /* num of blks per alloc group */
225*4882a593Smuzhiyun signed char dn_maxfreebud; /* max free buddy system */
226*4882a593Smuzhiyun }; /* - 4096 - */
227*4882a593Smuzhiyun /*
228*4882a593Smuzhiyun * in-memory aggregate disk allocation map descriptor.
229*4882a593Smuzhiyun */
230*4882a593Smuzhiyun struct bmap {
231*4882a593Smuzhiyun struct dbmap db_bmap; /* on-disk aggregate map descriptor */
232*4882a593Smuzhiyun struct inode *db_ipbmap; /* ptr to aggregate map incore inode */
233*4882a593Smuzhiyun struct mutex db_bmaplock; /* aggregate map lock */
234*4882a593Smuzhiyun atomic_t db_active[MAXAG]; /* count of active, open files in AG */
235*4882a593Smuzhiyun u32 *db_DBmap;
236*4882a593Smuzhiyun };
237*4882a593Smuzhiyun
/*
 * macros for accessing fields within in-memory aggregate map descriptor
 *
 * Each db_<field> names the dn_<field> member of the db_bmap embedded in
 * struct bmap.  Listed in struct dbmap field order.
 */
#define db_mapsize	db_bmap.dn_mapsize
#define db_nfree	db_bmap.dn_nfree
#define db_l2nbperpage	db_bmap.dn_l2nbperpage
#define db_numag	db_bmap.dn_numag
#define db_maxlevel	db_bmap.dn_maxlevel
#define db_maxag	db_bmap.dn_maxag
#define db_agpref	db_bmap.dn_agpref
#define db_aglevel	db_bmap.dn_aglevel
#define db_agheight	db_bmap.dn_agheight
#define db_agwidth	db_bmap.dn_agwidth
#define db_agstart	db_bmap.dn_agstart
#define db_agl2size	db_bmap.dn_agl2size
#define db_agfree	db_bmap.dn_agfree
#define db_agsize	db_bmap.dn_agsize
#define db_maxfreebud	db_bmap.dn_maxfreebud
254*4882a593Smuzhiyun
/*
 * macros for various conversions needed by the allocators.
 * blkstol2(), cntlz(), and cnttz() are operating system dependent functions
 * that are not declared in this header.
 */

/*
 * convert number of blocks to log2 number of blocks, rounding up to
 * the next log2 value if blocks is not a l2 multiple.
 */
#define BLKSTOL2(d)		(blkstol2(d))

/* convert number of leafs to log2 leaf value */
#define NLSTOL2BSZ(n)		(31 - cntlz((n)) + BUDMIN)

/*
 * convert leaf index to log2 leaf value: cnttz() of the index plus b,
 * except that index 0 uses m in place of cnttz()
 */
#define LITOL2BSZ(n,m,b)	((b) + (((n) != 0) ? cnttz((n)) : (m)))

/*
 * convert a block number to a dmap control leaf index: keep the low
 * (m + L2LPERCTL) bits of b, then drop the low m bits
 */
#define BLKTOCTLLEAF(b,m)	\
	(((b) & (((s64)1 << ((m) + L2LPERCTL)) - 1)) >> (m))

/* convert log2 leaf value to buddy size */
#define BUDSIZE(s,m)		(1 << ((s) - (m)))
276*4882a593Smuzhiyun
277*4882a593Smuzhiyun /*
278*4882a593Smuzhiyun * external references.
279*4882a593Smuzhiyun */
280*4882a593Smuzhiyun extern int dbMount(struct inode *ipbmap);
281*4882a593Smuzhiyun
282*4882a593Smuzhiyun extern int dbUnmount(struct inode *ipbmap, int mounterror);
283*4882a593Smuzhiyun
284*4882a593Smuzhiyun extern int dbFree(struct inode *ipbmap, s64 blkno, s64 nblocks);
285*4882a593Smuzhiyun
286*4882a593Smuzhiyun extern int dbUpdatePMap(struct inode *ipbmap,
287*4882a593Smuzhiyun int free, s64 blkno, s64 nblocks, struct tblock * tblk);
288*4882a593Smuzhiyun
289*4882a593Smuzhiyun extern int dbNextAG(struct inode *ipbmap);
290*4882a593Smuzhiyun
291*4882a593Smuzhiyun extern int dbAlloc(struct inode *ipbmap, s64 hint, s64 nblocks, s64 * results);
292*4882a593Smuzhiyun
293*4882a593Smuzhiyun extern int dbReAlloc(struct inode *ipbmap,
294*4882a593Smuzhiyun s64 blkno, s64 nblocks, s64 addnblocks, s64 * results);
295*4882a593Smuzhiyun
296*4882a593Smuzhiyun extern int dbSync(struct inode *ipbmap);
297*4882a593Smuzhiyun extern int dbAllocBottomUp(struct inode *ip, s64 blkno, s64 nblocks);
298*4882a593Smuzhiyun extern int dbExtendFS(struct inode *ipbmap, s64 blkno, s64 nblocks);
299*4882a593Smuzhiyun extern void dbFinalizeBmap(struct inode *ipbmap);
300*4882a593Smuzhiyun extern s64 dbMapFileSizeToMapSize(struct inode *ipbmap);
301*4882a593Smuzhiyun extern s64 dbDiscardAG(struct inode *ip, int agno, s64 minlen);
302*4882a593Smuzhiyun
303*4882a593Smuzhiyun #endif /* _H_JFS_DMAP */
304