Mirror of https://mirrors.bfsu.edu.cn/git/linux.git (synced 2024-11-16 16:54:20 +08:00)
98dc08bae6
As a step towards freeing the PG_error flag for other uses, change ext4 and f2fs to stop using PG_error to track verity errors. Instead, if a verity error occurs, just mark the whole bio as failed. The coarser granularity isn't really a problem since it isn't any worse than what the block layer provides, and errors from a multi-page readahead aren't reported to applications unless a single-page read fails too.

f2fs supports compression, which makes the f2fs changes a bit more complicated than desired, but the basic premise still works. Note: there are still a few uses of PageError in f2fs, but they are on the write path, so they are unrelated and this patch doesn't touch them.

Reviewed-by: Chao Yu <chao@kernel.org>
Acked-by: Jaegeuk Kim <jaegeuk@kernel.org>
Signed-off-by: Eric Biggers <ebiggers@google.com>
Link: https://lore.kernel.org/r/20221129070401.156114-1-ebiggers@kernel.org
292 lines · 9.3 KiB · C

// SPDX-License-Identifier: GPL-2.0
/*
 * Data verification functions, i.e. hooks for ->readahead()
 *
 * Copyright 2019 Google LLC
 */

#include "fsverity_private.h"

#include <crypto/hash.h>
#include <linux/bio.h>
#include <linux/ratelimit.h>

static struct workqueue_struct *fsverity_read_workqueue;

/**
 * hash_at_level() - compute the location of the block's hash at the given level
 *
 * @params: (in) the Merkle tree parameters
 * @dindex: (in) the index of the data block being verified
 * @level: (in) the level of hash we want (0 is leaf level)
 * @hindex: (out) the index of the hash block containing the wanted hash
 * @hoffset: (out) the byte offset to the wanted hash within the hash block
 */
static void hash_at_level(const struct merkle_tree_params *params,
			  pgoff_t dindex, unsigned int level, pgoff_t *hindex,
			  unsigned int *hoffset)
{
	pgoff_t position;

	/* Offset of the hash within the level's region, in hashes */
	position = dindex >> (level * params->log_arity);

	/* Index of the hash block in the tree overall */
	*hindex = params->level_start[level] + (position >> params->log_arity);

	/* Offset of the wanted hash (in bytes) within the hash block */
	*hoffset = (position & ((1 << params->log_arity) - 1)) <<
		   (params->log_blocksize - params->log_arity);
}
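
/*
 * Worked example (editorial illustration, not part of the original source):
 * with SHA-256 (32-byte digests) and 4096-byte blocks, a hash block holds
 * 4096 / 32 = 128 hashes, so log_arity = 7 and log_blocksize = 12. For data
 * block dindex = 1000000 at level 0: position = 1000000, the containing hash
 * block is level_start[0] + (1000000 >> 7) = level_start[0] + 7812, and the
 * wanted hash sits at byte offset (1000000 & 127) << (12 - 7) = 64 * 32 =
 * 2048 within that block.
 */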

static inline int cmp_hashes(const struct fsverity_info *vi,
			     const u8 *want_hash, const u8 *real_hash,
			     pgoff_t index, int level)
{
	const unsigned int hsize = vi->tree_params.digest_size;

	if (memcmp(want_hash, real_hash, hsize) == 0)
		return 0;

	fsverity_err(vi->inode,
		     "FILE CORRUPTED! index=%lu, level=%d, want_hash=%s:%*phN, real_hash=%s:%*phN",
		     index, level,
		     vi->tree_params.hash_alg->name, hsize, want_hash,
		     vi->tree_params.hash_alg->name, hsize, real_hash);
	return -EBADMSG;
}

/*
 * Verify a single data page against the file's Merkle tree.
 *
 * In principle, we need to verify the entire path to the root node. However,
 * for efficiency the filesystem may cache the hash pages. Therefore we need
 * only ascend the tree until an already-verified page is seen, as indicated by
 * the PageChecked bit being set; then verify the path to that page.
 *
 * This code currently only supports the case where the verity block size is
 * equal to PAGE_SIZE. Doing otherwise would be possible but tricky, since we
 * wouldn't be able to use the PageChecked bit.
 *
 * Note that multiple processes may race to verify a hash page and mark it
 * Checked, but it doesn't matter; the result will be the same either way.
 *
 * Return: true if the page is valid, else false.
 */
static bool verify_page(struct inode *inode, const struct fsverity_info *vi,
			struct ahash_request *req, struct page *data_page,
			unsigned long level0_ra_pages)
{
	const struct merkle_tree_params *params = &vi->tree_params;
	const unsigned int hsize = params->digest_size;
	const pgoff_t index = data_page->index;
	int level;
	u8 _want_hash[FS_VERITY_MAX_DIGEST_SIZE];
	const u8 *want_hash;
	u8 real_hash[FS_VERITY_MAX_DIGEST_SIZE];
	struct page *hpages[FS_VERITY_MAX_LEVELS];
	unsigned int hoffsets[FS_VERITY_MAX_LEVELS];
	int err;

	if (WARN_ON_ONCE(!PageLocked(data_page) || PageUptodate(data_page)))
		return false;

	pr_debug_ratelimited("Verifying data page %lu...\n", index);

	/*
	 * Starting at the leaf level, ascend the tree saving hash pages along
	 * the way until we find a verified hash page, indicated by PageChecked;
	 * or until we reach the root.
	 */
	for (level = 0; level < params->num_levels; level++) {
		pgoff_t hindex;
		unsigned int hoffset;
		struct page *hpage;

		hash_at_level(params, index, level, &hindex, &hoffset);

		pr_debug_ratelimited("Level %d: hindex=%lu, hoffset=%u\n",
				     level, hindex, hoffset);

		hpage = inode->i_sb->s_vop->read_merkle_tree_page(inode, hindex,
				level == 0 ? level0_ra_pages : 0);
		if (IS_ERR(hpage)) {
			err = PTR_ERR(hpage);
			fsverity_err(inode,
				     "Error %d reading Merkle tree page %lu",
				     err, hindex);
			goto out;
		}

		if (PageChecked(hpage)) {
			memcpy_from_page(_want_hash, hpage, hoffset, hsize);
			want_hash = _want_hash;
			put_page(hpage);
			pr_debug_ratelimited("Hash page already checked, want %s:%*phN\n",
					     params->hash_alg->name,
					     hsize, want_hash);
			goto descend;
		}
		pr_debug_ratelimited("Hash page not yet checked\n");
		hpages[level] = hpage;
		hoffsets[level] = hoffset;
	}

	want_hash = vi->root_hash;
	pr_debug("Want root hash: %s:%*phN\n",
		 params->hash_alg->name, hsize, want_hash);
descend:
	/* Descend the tree verifying hash pages */
	for (; level > 0; level--) {
		struct page *hpage = hpages[level - 1];
		unsigned int hoffset = hoffsets[level - 1];

		err = fsverity_hash_page(params, inode, req, hpage, real_hash);
		if (err)
			goto out;
		err = cmp_hashes(vi, want_hash, real_hash, index, level - 1);
		if (err)
			goto out;
		SetPageChecked(hpage);
		memcpy_from_page(_want_hash, hpage, hoffset, hsize);
		want_hash = _want_hash;
		put_page(hpage);
		pr_debug("Verified hash page at level %d, now want %s:%*phN\n",
			 level - 1, params->hash_alg->name, hsize, want_hash);
	}

	/* Finally, verify the data page */
	err = fsverity_hash_page(params, inode, req, data_page, real_hash);
	if (err)
		goto out;
	err = cmp_hashes(vi, want_hash, real_hash, index, -1);
out:
	for (; level > 0; level--)
		put_page(hpages[level - 1]);

	return err == 0;
}
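
/*
 * Tree-shape example (editorial illustration, not part of the original
 * source): with SHA-256 and 4096-byte blocks (128 hashes per hash block), a
 * 1 MiB file has 256 data blocks, so level 0 needs 2 hash blocks and level 1
 * needs 1, giving num_levels = 2. Verifying one data page therefore touches
 * at most one hash page per level, stopping early at the first page already
 * marked PageChecked; only a fully cold walk compares against vi->root_hash.
 */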

/**
 * fsverity_verify_page() - verify a data page
 * @page: the page to verify
 *
 * Verify a page that has just been read from a verity file. The page must be a
 * pagecache page that is still locked and not yet uptodate.
 *
 * Return: true if the page is valid, else false.
 */
bool fsverity_verify_page(struct page *page)
{
	struct inode *inode = page->mapping->host;
	const struct fsverity_info *vi = inode->i_verity_info;
	struct ahash_request *req;
	bool valid;

	/* This allocation never fails, since it's mempool-backed. */
	req = fsverity_alloc_hash_request(vi->tree_params.hash_alg, GFP_NOFS);

	valid = verify_page(inode, vi, req, page, 0);

	fsverity_free_hash_request(vi->tree_params.hash_alg, req);

	return valid;
}
EXPORT_SYMBOL_GPL(fsverity_verify_page);
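
/*
 * Editorial sketch, not part of the original source: how a filesystem that
 * populates the page cache without bios might call fsverity_verify_page() on
 * each page it reads. "example_finish_read" is a hypothetical helper;
 * fsverity_active() is the real inline from <linux/fsverity.h>.
 */
#if 0	/* illustration only */
static void example_finish_read(struct inode *inode, struct page *page)
{
	/* The page must still be locked and not yet uptodate here. */
	if (fsverity_active(inode) && !fsverity_verify_page(page)) {
		/* Leave the page !Uptodate so the read fails with -EIO. */
		unlock_page(page);
		return;
	}
	SetPageUptodate(page);
	unlock_page(page);
}
#endif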

#ifdef CONFIG_BLOCK
/**
 * fsverity_verify_bio() - verify a 'read' bio that has just completed
 * @bio: the bio to verify
 *
 * Verify a set of pages that have just been read from a verity file. The pages
 * must be pagecache pages that are still locked and not yet uptodate. If a
 * page fails verification, then bio->bi_status is set to an error status.
 *
 * This is a helper function for use by the ->readahead() method of filesystems
 * that issue bios to read data directly into the page cache. Filesystems that
 * populate the page cache without issuing bios (e.g. non block-based
 * filesystems) must instead call fsverity_verify_page() directly on each page.
 * All filesystems must also call fsverity_verify_page() on holes.
 */
void fsverity_verify_bio(struct bio *bio)
{
	struct inode *inode = bio_first_page_all(bio)->mapping->host;
	const struct fsverity_info *vi = inode->i_verity_info;
	const struct merkle_tree_params *params = &vi->tree_params;
	struct ahash_request *req;
	struct bio_vec *bv;
	struct bvec_iter_all iter_all;
	unsigned long max_ra_pages = 0;

	/* This allocation never fails, since it's mempool-backed. */
	req = fsverity_alloc_hash_request(params->hash_alg, GFP_NOFS);

	if (bio->bi_opf & REQ_RAHEAD) {
		/*
		 * If this bio is for data readahead, then we also do readahead
		 * of the first (largest) level of the Merkle tree. Namely,
		 * when a Merkle tree page is read, we also try to piggy-back on
		 * some additional pages -- up to 1/4 the number of data pages.
		 *
		 * This improves sequential read performance, as it greatly
		 * reduces the number of I/O requests made to the Merkle tree.
		 */
		bio_for_each_segment_all(bv, bio, iter_all)
			max_ra_pages++;
		max_ra_pages /= 4;
	}

	bio_for_each_segment_all(bv, bio, iter_all) {
		struct page *page = bv->bv_page;
		unsigned long level0_index = page->index >> params->log_arity;
		unsigned long level0_ra_pages =
			min(max_ra_pages, params->level0_blocks - level0_index);

		if (!verify_page(inode, vi, req, page, level0_ra_pages)) {
			bio->bi_status = BLK_STS_IOERR;
			break;
		}
	}

	fsverity_free_hash_request(params->hash_alg, req);
}
EXPORT_SYMBOL_GPL(fsverity_verify_bio);
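
/*
 * Editorial sketch, not part of the original source: the usual calling
 * pattern, modeled loosely on ext4 and f2fs. A read bio's endio handler runs
 * in a context where it must not do the CPU-heavy hashing itself, so it
 * defers to the fs-verity workqueue via fsverity_enqueue_verify_work(). All
 * "example_"-prefixed names are hypothetical.
 */
#if 0	/* illustration only */
struct example_post_read_ctx {
	struct bio *bio;
	struct work_struct work;
};

static void example_verity_work(struct work_struct *work)
{
	struct example_post_read_ctx *ctx =
		container_of(work, struct example_post_read_ctx, work);

	/* Sets ctx->bio->bi_status on verification failure. */
	fsverity_verify_bio(ctx->bio);

	/* Hypothetical: unlock pages, marking them uptodate only on success. */
	example_finish_bio(ctx->bio);
}

static void example_read_endio(struct bio *bio)
{
	struct example_post_read_ctx *ctx = bio->bi_private;

	if (!bio->bi_status && fsverity_active(example_bio_inode(bio))) {
		INIT_WORK(&ctx->work, example_verity_work);
		fsverity_enqueue_verify_work(&ctx->work);
		return;
	}
	example_finish_bio(bio);
}
#endif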
#endif /* CONFIG_BLOCK */

/**
 * fsverity_enqueue_verify_work() - enqueue work on the fs-verity workqueue
 * @work: the work to enqueue
 *
 * Enqueue verification work for asynchronous processing.
 */
void fsverity_enqueue_verify_work(struct work_struct *work)
{
	queue_work(fsverity_read_workqueue, work);
}
EXPORT_SYMBOL_GPL(fsverity_enqueue_verify_work);

int __init fsverity_init_workqueue(void)
{
	/*
	 * Use an unbound workqueue to allow bios to be verified in parallel
	 * even when they happen to complete on the same CPU. This sacrifices
	 * locality, but it's worthwhile since hashing is CPU-intensive.
	 *
	 * Also use a high-priority workqueue to prioritize verification work,
	 * which blocks reads from completing, over regular application tasks.
	 */
	fsverity_read_workqueue = alloc_workqueue("fsverity_read_queue",
						  WQ_UNBOUND | WQ_HIGHPRI,
						  num_online_cpus());
	if (!fsverity_read_workqueue)
		return -ENOMEM;
	return 0;
}

void __init fsverity_exit_workqueue(void)
{
	destroy_workqueue(fsverity_read_workqueue);
	fsverity_read_workqueue = NULL;
}