// SPDX-License-Identifier: GPL-2.0 /* * fs/ext4/verity.c: fs-verity support for ext4 * * Copyright 2019 Google LLC
*/
/* * Implementation of fsverity_operations for ext4. * * ext4 stores the verity metadata (Merkle tree and fsverity_descriptor) past * the end of the file, starting at the first 64K boundary beyond i_size. This * approach works because (a) verity files are readonly, and (b) pages fully * beyond i_size aren't visible to userspace but can be read/written internally * by ext4 with only some relatively small changes to ext4. This approach * avoids having to depend on the EA_INODE feature and on rearchitecturing * ext4's xattr support to support paging multi-gigabyte xattrs into memory, and * to support encrypting xattrs. Note that the verity metadata *must* be * encrypted when the file is, since it contains hashes of the plaintext data. * * Using a 64K boundary rather than a 4K one keeps things ready for * architectures with 64K pages, and it doesn't necessarily waste space on-disk * since there can be a hole between i_size and the start of the Merkle tree.
*/
/* * Read some verity metadata from the inode. __vfs_read() can't be used because * we need to read beyond i_size.
*/ staticint pagecache_read(struct inode *inode, void *buf, size_t count,
loff_t pos)
{ while (count) { struct folio *folio;
size_t n;
n = memcpy_from_file_folio(buf, folio, pos, count);
folio_put(folio);
buf += n;
pos += n;
count -= n;
} return 0;
}
/* * Write some verity metadata to the inode for FS_IOC_ENABLE_VERITY. * kernel_write() can't be used because the file descriptor is readonly.
*/ staticint pagecache_write(struct inode *inode, constvoid *buf, size_t count,
loff_t pos)
{ struct address_space *mapping = inode->i_mapping; conststruct address_space_operations *aops = mapping->a_ops;
if (pos + count > inode->i_sb->s_maxbytes) return -EFBIG;
while (count) {
size_t n = min_t(size_t, count,
PAGE_SIZE - offset_in_page(pos)); struct folio *folio; void *fsdata = NULL; int res;
res = aops->write_begin(NULL, mapping, pos, n, &folio, &fsdata); if (res) return res;
res = aops->write_end(NULL, mapping, pos, n, n, folio, fsdata); if (res < 0) return res; if (res != n) return -EIO;
buf += n;
pos += n;
count -= n;
} return 0;
}
staticint ext4_begin_enable_verity(struct file *filp)
{ struct inode *inode = file_inode(filp); constint credits = 2; /* superblock and inode for ext4_orphan_add() */
handle_t *handle; int err;
if (IS_DAX(inode) || ext4_test_inode_flag(inode, EXT4_INODE_DAX)) return -EINVAL;
if (ext4_verity_in_progress(inode)) return -EBUSY;
/* * Since the file was opened readonly, we have to initialize the jbd * inode and quotas here and not rely on ->open() doing it. This must * be done before evicting the inline data.
*/
err = ext4_inode_attach_jinode(inode); if (err) return err;
err = dquot_initialize(inode); if (err) return err;
err = ext4_convert_inline_data(inode); if (err) return err;
if (!ext4_test_inode_flag(inode, EXT4_INODE_EXTENTS)) {
ext4_warning_inode(inode, "verity is only allowed on extent-based files"); return -EOPNOTSUPP;
}
/* * ext4 uses the last allocated block to find the verity descriptor, so * we must remove any other blocks past EOF which might confuse things.
*/
err = ext4_truncate(inode); if (err) return err;
handle = ext4_journal_start(inode, EXT4_HT_INODE, credits); if (IS_ERR(handle)) return PTR_ERR(handle);
err = ext4_orphan_add(handle, inode); if (err == 0)
ext4_set_inode_state(inode, EXT4_STATE_VERITY_IN_PROGRESS);
ext4_journal_stop(handle); return err;
}
/* * ext4 stores the verity descriptor beginning on the next filesystem block * boundary after the Merkle tree. Then, the descriptor size is stored in the * last 4 bytes of the last allocated filesystem block --- which is either the * block in which the descriptor ends, or the next block after that if there * weren't at least 4 bytes remaining. * * We can't simply store the descriptor in an xattr because it *must* be * encrypted when ext4 encryption is used, but ext4 encryption doesn't encrypt * xattrs. Also, if the descriptor includes a large signature blob it may be * too large to store in an xattr without the EA_INODE feature.
*/ staticint ext4_write_verity_descriptor(struct inode *inode, constvoid *desc,
size_t desc_size, u64 merkle_tree_size)
{ const u64 desc_pos = round_up(ext4_verity_metadata_pos(inode) +
merkle_tree_size, i_blocksize(inode)); const u64 desc_end = desc_pos + desc_size; const __le32 desc_size_disk = cpu_to_le32(desc_size); const u64 desc_size_pos = round_up(desc_end + sizeof(desc_size_disk),
i_blocksize(inode)) - sizeof(desc_size_disk); int err;
err = pagecache_write(inode, desc, desc_size, desc_pos); if (err) return err;
/* * If an error already occurred (which fs/verity/ signals by passing * desc == NULL), then only clean-up is needed.
*/ if (desc == NULL) goto cleanup;
/* Append the verity descriptor. */
err = ext4_write_verity_descriptor(inode, desc, desc_size,
merkle_tree_size); if (err) goto cleanup;
/* * Write all pages (both data and verity metadata). Note that this must * happen before clearing EXT4_STATE_VERITY_IN_PROGRESS; otherwise pages * beyond i_size won't be written properly. For crash consistency, this * also must happen before the verity inode flag gets persisted.
*/
err = filemap_write_and_wait(inode->i_mapping); if (err) goto cleanup;
/* * Finally, set the verity inode flag and remove the inode from the * orphan list (in a single transaction).
*/
stop_and_cleanup:
ext4_journal_stop(handle);
cleanup: /* * Verity failed to be enabled, so clean up by truncating any verity * metadata that was written beyond i_size (both from cache and from * disk), removing the inode from the orphan list (if it wasn't done * already), and clearing EXT4_STATE_VERITY_IN_PROGRESS.
*/
truncate_inode_pages(inode->i_mapping, inode->i_size);
ext4_truncate(inode);
ext4_orphan_del(NULL, inode);
ext4_clear_inode_state(inode, EXT4_STATE_VERITY_IN_PROGRESS); return err;
}
Die Informationen auf dieser Webseite wurden
nach bestem Wissen sorgfältig zusammengestellt. Es wird jedoch weder Vollständigkeit, noch Richtigkeit,
noch Qualität der bereit gestellten Informationen zugesichert.
Bemerkung:
Die farbliche Syntaxdarstellung und die Messung sind noch experimentell.