1*4882a593Smuzhiyun // SPDX-License-Identifier: GPL-2.0
2*4882a593Smuzhiyun /*
3*4882a593Smuzhiyun * Data verification functions, i.e. hooks for ->readpages()
4*4882a593Smuzhiyun *
5*4882a593Smuzhiyun * Copyright 2019 Google LLC
6*4882a593Smuzhiyun */
7*4882a593Smuzhiyun
8*4882a593Smuzhiyun #include "fsverity_private.h"
9*4882a593Smuzhiyun
10*4882a593Smuzhiyun #include <crypto/hash.h>
11*4882a593Smuzhiyun #include <linux/bio.h>
12*4882a593Smuzhiyun #include <linux/ratelimit.h>
13*4882a593Smuzhiyun
14*4882a593Smuzhiyun static struct workqueue_struct *fsverity_read_workqueue;
15*4882a593Smuzhiyun
16*4882a593Smuzhiyun /**
17*4882a593Smuzhiyun * hash_at_level() - compute the location of the block's hash at the given level
18*4882a593Smuzhiyun *
19*4882a593Smuzhiyun * @params: (in) the Merkle tree parameters
20*4882a593Smuzhiyun * @dindex: (in) the index of the data block being verified
21*4882a593Smuzhiyun * @level: (in) the level of hash we want (0 is leaf level)
22*4882a593Smuzhiyun * @hindex: (out) the index of the hash block containing the wanted hash
23*4882a593Smuzhiyun * @hoffset: (out) the byte offset to the wanted hash within the hash block
24*4882a593Smuzhiyun */
hash_at_level(const struct merkle_tree_params * params,pgoff_t dindex,unsigned int level,pgoff_t * hindex,unsigned int * hoffset)25*4882a593Smuzhiyun static void hash_at_level(const struct merkle_tree_params *params,
26*4882a593Smuzhiyun pgoff_t dindex, unsigned int level, pgoff_t *hindex,
27*4882a593Smuzhiyun unsigned int *hoffset)
28*4882a593Smuzhiyun {
29*4882a593Smuzhiyun pgoff_t position;
30*4882a593Smuzhiyun
31*4882a593Smuzhiyun /* Offset of the hash within the level's region, in hashes */
32*4882a593Smuzhiyun position = dindex >> (level * params->log_arity);
33*4882a593Smuzhiyun
34*4882a593Smuzhiyun /* Index of the hash block in the tree overall */
35*4882a593Smuzhiyun *hindex = params->level_start[level] + (position >> params->log_arity);
36*4882a593Smuzhiyun
37*4882a593Smuzhiyun /* Offset of the wanted hash (in bytes) within the hash block */
38*4882a593Smuzhiyun *hoffset = (position & ((1 << params->log_arity) - 1)) <<
39*4882a593Smuzhiyun (params->log_blocksize - params->log_arity);
40*4882a593Smuzhiyun }
41*4882a593Smuzhiyun
42*4882a593Smuzhiyun /* Extract a hash from a hash page */
extract_hash(struct page * hpage,unsigned int hoffset,unsigned int hsize,u8 * out)43*4882a593Smuzhiyun static void extract_hash(struct page *hpage, unsigned int hoffset,
44*4882a593Smuzhiyun unsigned int hsize, u8 *out)
45*4882a593Smuzhiyun {
46*4882a593Smuzhiyun void *virt = kmap_atomic(hpage);
47*4882a593Smuzhiyun
48*4882a593Smuzhiyun memcpy(out, virt + hoffset, hsize);
49*4882a593Smuzhiyun kunmap_atomic(virt);
50*4882a593Smuzhiyun }
51*4882a593Smuzhiyun
cmp_hashes(const struct fsverity_info * vi,const u8 * want_hash,const u8 * real_hash,pgoff_t index,int level)52*4882a593Smuzhiyun static inline int cmp_hashes(const struct fsverity_info *vi,
53*4882a593Smuzhiyun const u8 *want_hash, const u8 *real_hash,
54*4882a593Smuzhiyun pgoff_t index, int level)
55*4882a593Smuzhiyun {
56*4882a593Smuzhiyun const unsigned int hsize = vi->tree_params.digest_size;
57*4882a593Smuzhiyun
58*4882a593Smuzhiyun if (memcmp(want_hash, real_hash, hsize) == 0)
59*4882a593Smuzhiyun return 0;
60*4882a593Smuzhiyun
61*4882a593Smuzhiyun fsverity_err(vi->inode,
62*4882a593Smuzhiyun "FILE CORRUPTED! index=%lu, level=%d, want_hash=%s:%*phN, real_hash=%s:%*phN",
63*4882a593Smuzhiyun index, level,
64*4882a593Smuzhiyun vi->tree_params.hash_alg->name, hsize, want_hash,
65*4882a593Smuzhiyun vi->tree_params.hash_alg->name, hsize, real_hash);
66*4882a593Smuzhiyun return -EBADMSG;
67*4882a593Smuzhiyun }
68*4882a593Smuzhiyun
69*4882a593Smuzhiyun /*
70*4882a593Smuzhiyun * Verify a single data page against the file's Merkle tree.
71*4882a593Smuzhiyun *
72*4882a593Smuzhiyun * In principle, we need to verify the entire path to the root node. However,
73*4882a593Smuzhiyun * for efficiency the filesystem may cache the hash pages. Therefore we need
74*4882a593Smuzhiyun * only ascend the tree until an already-verified page is seen, as indicated by
75*4882a593Smuzhiyun * the PageChecked bit being set; then verify the path to that page.
76*4882a593Smuzhiyun *
77*4882a593Smuzhiyun * This code currently only supports the case where the verity block size is
78*4882a593Smuzhiyun * equal to PAGE_SIZE. Doing otherwise would be possible but tricky, since we
79*4882a593Smuzhiyun * wouldn't be able to use the PageChecked bit.
80*4882a593Smuzhiyun *
81*4882a593Smuzhiyun * Note that multiple processes may race to verify a hash page and mark it
82*4882a593Smuzhiyun * Checked, but it doesn't matter; the result will be the same either way.
83*4882a593Smuzhiyun *
84*4882a593Smuzhiyun * Return: true if the page is valid, else false.
85*4882a593Smuzhiyun */
verify_page(struct inode * inode,const struct fsverity_info * vi,struct ahash_request * req,struct page * data_page,unsigned long level0_ra_pages)86*4882a593Smuzhiyun static bool verify_page(struct inode *inode, const struct fsverity_info *vi,
87*4882a593Smuzhiyun struct ahash_request *req, struct page *data_page,
88*4882a593Smuzhiyun unsigned long level0_ra_pages)
89*4882a593Smuzhiyun {
90*4882a593Smuzhiyun const struct merkle_tree_params *params = &vi->tree_params;
91*4882a593Smuzhiyun const unsigned int hsize = params->digest_size;
92*4882a593Smuzhiyun const pgoff_t index = data_page->index;
93*4882a593Smuzhiyun int level;
94*4882a593Smuzhiyun u8 _want_hash[FS_VERITY_MAX_DIGEST_SIZE];
95*4882a593Smuzhiyun const u8 *want_hash;
96*4882a593Smuzhiyun u8 real_hash[FS_VERITY_MAX_DIGEST_SIZE];
97*4882a593Smuzhiyun struct page *hpages[FS_VERITY_MAX_LEVELS];
98*4882a593Smuzhiyun unsigned int hoffsets[FS_VERITY_MAX_LEVELS];
99*4882a593Smuzhiyun int err;
100*4882a593Smuzhiyun
101*4882a593Smuzhiyun if (WARN_ON_ONCE(!PageLocked(data_page) || PageUptodate(data_page)))
102*4882a593Smuzhiyun return false;
103*4882a593Smuzhiyun
104*4882a593Smuzhiyun pr_debug_ratelimited("Verifying data page %lu...\n", index);
105*4882a593Smuzhiyun
106*4882a593Smuzhiyun /*
107*4882a593Smuzhiyun * Starting at the leaf level, ascend the tree saving hash pages along
108*4882a593Smuzhiyun * the way until we find a verified hash page, indicated by PageChecked;
109*4882a593Smuzhiyun * or until we reach the root.
110*4882a593Smuzhiyun */
111*4882a593Smuzhiyun for (level = 0; level < params->num_levels; level++) {
112*4882a593Smuzhiyun pgoff_t hindex;
113*4882a593Smuzhiyun unsigned int hoffset;
114*4882a593Smuzhiyun struct page *hpage;
115*4882a593Smuzhiyun
116*4882a593Smuzhiyun hash_at_level(params, index, level, &hindex, &hoffset);
117*4882a593Smuzhiyun
118*4882a593Smuzhiyun pr_debug_ratelimited("Level %d: hindex=%lu, hoffset=%u\n",
119*4882a593Smuzhiyun level, hindex, hoffset);
120*4882a593Smuzhiyun
121*4882a593Smuzhiyun hpage = inode->i_sb->s_vop->read_merkle_tree_page(inode, hindex,
122*4882a593Smuzhiyun level == 0 ? level0_ra_pages : 0);
123*4882a593Smuzhiyun if (IS_ERR(hpage)) {
124*4882a593Smuzhiyun err = PTR_ERR(hpage);
125*4882a593Smuzhiyun fsverity_err(inode,
126*4882a593Smuzhiyun "Error %d reading Merkle tree page %lu",
127*4882a593Smuzhiyun err, hindex);
128*4882a593Smuzhiyun goto out;
129*4882a593Smuzhiyun }
130*4882a593Smuzhiyun
131*4882a593Smuzhiyun if (PageChecked(hpage)) {
132*4882a593Smuzhiyun extract_hash(hpage, hoffset, hsize, _want_hash);
133*4882a593Smuzhiyun want_hash = _want_hash;
134*4882a593Smuzhiyun put_page(hpage);
135*4882a593Smuzhiyun pr_debug_ratelimited("Hash page already checked, want %s:%*phN\n",
136*4882a593Smuzhiyun params->hash_alg->name,
137*4882a593Smuzhiyun hsize, want_hash);
138*4882a593Smuzhiyun goto descend;
139*4882a593Smuzhiyun }
140*4882a593Smuzhiyun pr_debug_ratelimited("Hash page not yet checked\n");
141*4882a593Smuzhiyun hpages[level] = hpage;
142*4882a593Smuzhiyun hoffsets[level] = hoffset;
143*4882a593Smuzhiyun }
144*4882a593Smuzhiyun
145*4882a593Smuzhiyun want_hash = vi->root_hash;
146*4882a593Smuzhiyun pr_debug("Want root hash: %s:%*phN\n",
147*4882a593Smuzhiyun params->hash_alg->name, hsize, want_hash);
148*4882a593Smuzhiyun descend:
149*4882a593Smuzhiyun /* Descend the tree verifying hash pages */
150*4882a593Smuzhiyun for (; level > 0; level--) {
151*4882a593Smuzhiyun struct page *hpage = hpages[level - 1];
152*4882a593Smuzhiyun unsigned int hoffset = hoffsets[level - 1];
153*4882a593Smuzhiyun
154*4882a593Smuzhiyun err = fsverity_hash_page(params, inode, req, hpage, real_hash);
155*4882a593Smuzhiyun if (err)
156*4882a593Smuzhiyun goto out;
157*4882a593Smuzhiyun err = cmp_hashes(vi, want_hash, real_hash, index, level - 1);
158*4882a593Smuzhiyun if (err)
159*4882a593Smuzhiyun goto out;
160*4882a593Smuzhiyun SetPageChecked(hpage);
161*4882a593Smuzhiyun extract_hash(hpage, hoffset, hsize, _want_hash);
162*4882a593Smuzhiyun want_hash = _want_hash;
163*4882a593Smuzhiyun put_page(hpage);
164*4882a593Smuzhiyun pr_debug("Verified hash page at level %d, now want %s:%*phN\n",
165*4882a593Smuzhiyun level - 1, params->hash_alg->name, hsize, want_hash);
166*4882a593Smuzhiyun }
167*4882a593Smuzhiyun
168*4882a593Smuzhiyun /* Finally, verify the data page */
169*4882a593Smuzhiyun err = fsverity_hash_page(params, inode, req, data_page, real_hash);
170*4882a593Smuzhiyun if (err)
171*4882a593Smuzhiyun goto out;
172*4882a593Smuzhiyun err = cmp_hashes(vi, want_hash, real_hash, index, -1);
173*4882a593Smuzhiyun out:
174*4882a593Smuzhiyun for (; level > 0; level--)
175*4882a593Smuzhiyun put_page(hpages[level - 1]);
176*4882a593Smuzhiyun
177*4882a593Smuzhiyun return err == 0;
178*4882a593Smuzhiyun }
179*4882a593Smuzhiyun
180*4882a593Smuzhiyun /**
181*4882a593Smuzhiyun * fsverity_verify_page() - verify a data page
182*4882a593Smuzhiyun * @page: the page to verity
183*4882a593Smuzhiyun *
184*4882a593Smuzhiyun * Verify a page that has just been read from a verity file. The page must be a
185*4882a593Smuzhiyun * pagecache page that is still locked and not yet uptodate.
186*4882a593Smuzhiyun *
187*4882a593Smuzhiyun * Return: true if the page is valid, else false.
188*4882a593Smuzhiyun */
fsverity_verify_page(struct page * page)189*4882a593Smuzhiyun bool fsverity_verify_page(struct page *page)
190*4882a593Smuzhiyun {
191*4882a593Smuzhiyun struct inode *inode = page->mapping->host;
192*4882a593Smuzhiyun const struct fsverity_info *vi = inode->i_verity_info;
193*4882a593Smuzhiyun struct ahash_request *req;
194*4882a593Smuzhiyun bool valid;
195*4882a593Smuzhiyun
196*4882a593Smuzhiyun /* This allocation never fails, since it's mempool-backed. */
197*4882a593Smuzhiyun req = fsverity_alloc_hash_request(vi->tree_params.hash_alg, GFP_NOFS);
198*4882a593Smuzhiyun
199*4882a593Smuzhiyun valid = verify_page(inode, vi, req, page, 0);
200*4882a593Smuzhiyun
201*4882a593Smuzhiyun fsverity_free_hash_request(vi->tree_params.hash_alg, req);
202*4882a593Smuzhiyun
203*4882a593Smuzhiyun return valid;
204*4882a593Smuzhiyun }
205*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(fsverity_verify_page);
206*4882a593Smuzhiyun
207*4882a593Smuzhiyun #ifdef CONFIG_BLOCK
208*4882a593Smuzhiyun /**
209*4882a593Smuzhiyun * fsverity_verify_bio() - verify a 'read' bio that has just completed
210*4882a593Smuzhiyun * @bio: the bio to verify
211*4882a593Smuzhiyun *
212*4882a593Smuzhiyun * Verify a set of pages that have just been read from a verity file. The pages
213*4882a593Smuzhiyun * must be pagecache pages that are still locked and not yet uptodate. Pages
214*4882a593Smuzhiyun * that fail verification are set to the Error state. Verification is skipped
215*4882a593Smuzhiyun * for pages already in the Error state, e.g. due to fscrypt decryption failure.
216*4882a593Smuzhiyun *
217*4882a593Smuzhiyun * This is a helper function for use by the ->readpages() method of filesystems
218*4882a593Smuzhiyun * that issue bios to read data directly into the page cache. Filesystems that
219*4882a593Smuzhiyun * populate the page cache without issuing bios (e.g. non block-based
220*4882a593Smuzhiyun * filesystems) must instead call fsverity_verify_page() directly on each page.
221*4882a593Smuzhiyun * All filesystems must also call fsverity_verify_page() on holes.
222*4882a593Smuzhiyun */
fsverity_verify_bio(struct bio * bio)223*4882a593Smuzhiyun void fsverity_verify_bio(struct bio *bio)
224*4882a593Smuzhiyun {
225*4882a593Smuzhiyun struct inode *inode = bio_first_page_all(bio)->mapping->host;
226*4882a593Smuzhiyun const struct fsverity_info *vi = inode->i_verity_info;
227*4882a593Smuzhiyun const struct merkle_tree_params *params = &vi->tree_params;
228*4882a593Smuzhiyun struct ahash_request *req;
229*4882a593Smuzhiyun struct bio_vec *bv;
230*4882a593Smuzhiyun struct bvec_iter_all iter_all;
231*4882a593Smuzhiyun unsigned long max_ra_pages = 0;
232*4882a593Smuzhiyun
233*4882a593Smuzhiyun /* This allocation never fails, since it's mempool-backed. */
234*4882a593Smuzhiyun req = fsverity_alloc_hash_request(params->hash_alg, GFP_NOFS);
235*4882a593Smuzhiyun
236*4882a593Smuzhiyun if (bio->bi_opf & REQ_RAHEAD) {
237*4882a593Smuzhiyun /*
238*4882a593Smuzhiyun * If this bio is for data readahead, then we also do readahead
239*4882a593Smuzhiyun * of the first (largest) level of the Merkle tree. Namely,
240*4882a593Smuzhiyun * when a Merkle tree page is read, we also try to piggy-back on
241*4882a593Smuzhiyun * some additional pages -- up to 1/4 the number of data pages.
242*4882a593Smuzhiyun *
243*4882a593Smuzhiyun * This improves sequential read performance, as it greatly
244*4882a593Smuzhiyun * reduces the number of I/O requests made to the Merkle tree.
245*4882a593Smuzhiyun */
246*4882a593Smuzhiyun bio_for_each_segment_all(bv, bio, iter_all)
247*4882a593Smuzhiyun max_ra_pages++;
248*4882a593Smuzhiyun max_ra_pages /= 4;
249*4882a593Smuzhiyun }
250*4882a593Smuzhiyun
251*4882a593Smuzhiyun bio_for_each_segment_all(bv, bio, iter_all) {
252*4882a593Smuzhiyun struct page *page = bv->bv_page;
253*4882a593Smuzhiyun unsigned long level0_index = page->index >> params->log_arity;
254*4882a593Smuzhiyun unsigned long level0_ra_pages =
255*4882a593Smuzhiyun min(max_ra_pages, params->level0_blocks - level0_index);
256*4882a593Smuzhiyun
257*4882a593Smuzhiyun if (!PageError(page) &&
258*4882a593Smuzhiyun !verify_page(inode, vi, req, page, level0_ra_pages))
259*4882a593Smuzhiyun SetPageError(page);
260*4882a593Smuzhiyun }
261*4882a593Smuzhiyun
262*4882a593Smuzhiyun fsverity_free_hash_request(params->hash_alg, req);
263*4882a593Smuzhiyun }
264*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(fsverity_verify_bio);
265*4882a593Smuzhiyun #endif /* CONFIG_BLOCK */
266*4882a593Smuzhiyun
267*4882a593Smuzhiyun /**
268*4882a593Smuzhiyun * fsverity_enqueue_verify_work() - enqueue work on the fs-verity workqueue
269*4882a593Smuzhiyun * @work: the work to enqueue
270*4882a593Smuzhiyun *
271*4882a593Smuzhiyun * Enqueue verification work for asynchronous processing.
272*4882a593Smuzhiyun */
fsverity_enqueue_verify_work(struct work_struct * work)273*4882a593Smuzhiyun void fsverity_enqueue_verify_work(struct work_struct *work)
274*4882a593Smuzhiyun {
275*4882a593Smuzhiyun queue_work(fsverity_read_workqueue, work);
276*4882a593Smuzhiyun }
277*4882a593Smuzhiyun EXPORT_SYMBOL_GPL(fsverity_enqueue_verify_work);
278*4882a593Smuzhiyun
fsverity_init_workqueue(void)279*4882a593Smuzhiyun int __init fsverity_init_workqueue(void)
280*4882a593Smuzhiyun {
281*4882a593Smuzhiyun /*
282*4882a593Smuzhiyun * Use an unbound workqueue to allow bios to be verified in parallel
283*4882a593Smuzhiyun * even when they happen to complete on the same CPU. This sacrifices
284*4882a593Smuzhiyun * locality, but it's worthwhile since hashing is CPU-intensive.
285*4882a593Smuzhiyun *
286*4882a593Smuzhiyun * Also use a high-priority workqueue to prioritize verification work,
287*4882a593Smuzhiyun * which blocks reads from completing, over regular application tasks.
288*4882a593Smuzhiyun */
289*4882a593Smuzhiyun fsverity_read_workqueue = alloc_workqueue("fsverity_read_queue",
290*4882a593Smuzhiyun WQ_UNBOUND | WQ_HIGHPRI,
291*4882a593Smuzhiyun num_online_cpus());
292*4882a593Smuzhiyun if (!fsverity_read_workqueue)
293*4882a593Smuzhiyun return -ENOMEM;
294*4882a593Smuzhiyun return 0;
295*4882a593Smuzhiyun }
296*4882a593Smuzhiyun
fsverity_exit_workqueue(void)297*4882a593Smuzhiyun void __init fsverity_exit_workqueue(void)
298*4882a593Smuzhiyun {
299*4882a593Smuzhiyun destroy_workqueue(fsverity_read_workqueue);
300*4882a593Smuzhiyun fsverity_read_workqueue = NULL;
301*4882a593Smuzhiyun }
302