ref: 9944bc0d5f4e34f0cf3fd4ce8b3661fdc89e1cf2
parent: bf878b59ccb34a4cdafa48dbcdcd57c22f335c03
author: Sigrid Solveig Haflínudóttir <ftrvxmtrx@gmail.com>
date: Sun Nov 15 07:42:21 EST 2020
replace extents implementation with the updated one, bsd-licensed
--- a/README.md
+++ b/README.md
@@ -43,7 +43,6 @@
files must be removed first. At this point there are two files
licensed under GPLv2:
* ext4_xattr.c
-* ext4_extents.c
All other modules and headers are BSD-3-Clause licensed code.
--- a/include/ext4_extent.h
+++ b/include/ext4_extent.h
@@ -1,6 +1,7 @@
/*
* Copyright (c) 2013 Grzegorz Kostka (kostka.grzegorz@gmail.com)
*
+ *
* HelenOS:
* Copyright (c) 2012 Martin Sucha
* Copyright (c) 2012 Frantisek Princ
@@ -46,21 +47,314 @@
#include <ext4_config.h>
#include <ext4_types.h>
+#include <ext4_misc.h>
+
#include <ext4_inode.h>
-void ext4_extent_tree_init(struct ext4_inode_ref *inode_ref);
+/*
+ * Array of ext4_ext_path contains path to some extent.
+ * Creation/lookup routines use it for traversal/splitting/etc.
+ * Truncate uses it to simulate recursive walking.
+ */
+struct ext4_extent_path {
+ struct ext4_block block;
+ uint16_t depth;
+ struct ext4_extent_header *header;
+ struct ext4_extent_index *index;
+ struct ext4_extent *extent;
+};
+#define EXT4_EXT_UNWRITTEN_MASK (1L << 15)
-int ext4_extent_get_blocks(struct ext4_inode_ref *inode_ref, ext4_lblk_t iblock,
- uint32_t max_blocks, ext4_fsblk_t *result, bool create,
- uint32_t *blocks_count);
+#define EXT4_EXT_MAX_LEN_WRITTEN (1L << 15)
+#define EXT4_EXT_MAX_LEN_UNWRITTEN \
+ (EXT4_EXT_MAX_LEN_WRITTEN - 1)
+#define EXT4_EXT_GET_LEN(ex) to_le16((ex)->nblocks)
+#define EXT4_EXT_GET_LEN_UNWRITTEN(ex) \
+ (EXT4_EXT_GET_LEN(ex) &= ~(EXT4_EXT_UNWRITTEN_MASK))
+#define EXT4_EXT_SET_LEN(ex, count) \
+ ((ex)->nblocks = to_le16(count))
+#define EXT4_EXT_IS_UNWRITTEN(ex) \
+ (EXT4_EXT_GET_LEN(ex) > EXT4_EXT_MAX_LEN_WRITTEN)
+#define EXT4_EXT_SET_UNWRITTEN(ex) \
+ ((ex)->nblocks |= to_le16(EXT4_EXT_UNWRITTEN_MASK))
+#define EXT4_EXT_SET_WRITTEN(ex) \
+ ((ex)->nblocks &= ~(to_le16(EXT4_EXT_UNWRITTEN_MASK)))
+
+#define EXT4_EXTENT_FIRST(header) \
+ ((struct ext4_extent *)(((char *)(header)) + \
+ sizeof(struct ext4_extent_header)))
+
+#define EXT4_EXTENT_FIRST_INDEX(header) \
+ ((struct ext4_extent_index *)(((char *)(header)) + \
+ sizeof(struct ext4_extent_header)))
+
+#define EXT4_EXTENT_LAST(header) \
+ ((struct ext4_extent *)(((char *)(header)) + \
+ sizeof(struct ext4_extent_header)) + \
+ (header)->nentries - 1)
+
+#define EXT4_EXTENT_LAST_INDEX(header) \
+ ((struct ext4_extent_index *)(((char *)(header)) + \
+ sizeof(struct ext4_extent_header)) + \
+ (header)->nentries - 1)
+
+#define EXT4_EXTENT_SIZE sizeof(struct ext4_extent)
+#define EXT4_EXTENT_INDEX_SIZE sizeof(struct ext4_extent_index)
+
+#define EXT4_EXTENT_TAIL_OFFSET(hdr) \
+ (sizeof(struct ext4_extent_header) + \
+ (sizeof(struct ext4_extent) * to_le16((hdr)->max_nentries)))
+
+#define EXT4_EXTENT_IN_RANGE(iblock, eiblock, len) \
+ ((iblock) >= (eiblock) && (iblock) <= (eiblock) + (len) - 1)
+
+#define EXT4_EXTENT_MAX_BLOCKS ((uint32_t)(-1))
+
+/**@brief Get logical number of the block covered by extent.
+ * @param extent Extent to load number from
+ * @return Logical number of the first block covered by extent */
+static inline uint32_t ext4_extent_get_iblock(struct ext4_extent *extent)
+{
+ return to_le32(extent->iblock);
+}
+
+/**@brief Set logical number of the first block covered by extent.
+ * @param extent Extent to set number to
+ * @param iblock Logical number of the first block covered by extent */
+static inline void ext4_extent_set_iblock(struct ext4_extent *extent,
+ ext4_lblk_t iblock)
+{
+ extent->iblock = to_le32(iblock);
+}
+
+/**@brief Get number of blocks covered by extent.
+ * @param extent Extent to load count from
+ * @return Number of blocks covered by extent */
+static inline uint16_t ext4_extent_get_nblocks(struct ext4_extent *extent)
+{
+ if (EXT4_EXT_IS_UNWRITTEN(extent))
+ return EXT4_EXT_GET_LEN_UNWRITTEN(extent);
+ else
+ return EXT4_EXT_GET_LEN(extent);
+}
+/**@brief Set number of blocks covered by extent.
+ * @param extent Extent to load count from
+ * @param count Number of blocks covered by extent
+ * @param unwritten Whether the extent is unwritten or not */
+static inline void
+ext4_extent_set_nblocks(struct ext4_extent *extent,
+ uint16_t count, bool unwritten)
+{
+ EXT4_EXT_SET_LEN(extent, count);
+ if (unwritten)
+ EXT4_EXT_SET_UNWRITTEN(extent);
+}
+
+/**@brief Get physical number of the first block covered by extent.
+ * @param extent Extent to load number
+ * @return Physical number of the first block covered by extent */
+static inline uint64_t ext4_extent_get_fblock(struct ext4_extent *extent)
+{
+ return ((uint64_t)to_le16(extent->fblock_hi)) << 32 |
+ ((uint64_t)to_le32(extent->fblock_lo));
+}
+
+
+/**@brief Set physical number of the first block covered by extent.
+ * @param extent Extent to load number
+ * @param fblock Physical number of the first block covered by extent */
+static inline void
+ext4_extent_set_fblock(struct ext4_extent *extent, uint64_t fblock)
+{
+ extent->fblock_lo = to_le32((fblock << 32) >> 32);
+ extent->fblock_hi = to_le16((uint16_t)(fblock >> 32));
+}
+
+
+/**@brief Get logical number of the block covered by extent index.
+ * @param index Extent index to load number from
+ * @return Logical number of the first block covered by extent index */
+static inline uint32_t
+ext4_extent_index_get_iblock(struct ext4_extent_index *index)
+{
+ return to_le32(index->iblock);
+}
+
+/**@brief Set logical number of the block covered by extent index.
+ * @param index Extent index to set number to
+ * @param iblock Logical number of the first block covered by extent index */
+static inline void
+ext4_extent_index_set_iblock(struct ext4_extent_index *index,
+ uint32_t iblock)
+{
+ index->iblock = to_le32(iblock);
+}
+
+/**@brief Get physical number of block where the child node is located.
+ * @param index Extent index to load number from
+ * @return Physical number of the block with child node */
+static inline uint64_t
+ext4_extent_index_get_fblock(struct ext4_extent_index *index)
+{
+ return ((uint64_t)to_le16(index->fblock_hi)) << 32 |
+ ((uint64_t)to_le32(index->fblock_lo));
+}
+
+/**@brief Set physical number of block where the child node is located.
+ * @param index Extent index to set number to
+ * @param fblock Ohysical number of the block with child node */
+static inline void ext4_extent_index_set_fblock(struct ext4_extent_index *index,
+ uint64_t fblock)
+{
+ index->fblock_lo = to_le32((fblock << 32) >> 32);
+ index->fblock_hi = to_le16((uint16_t)(fblock >> 32));
+}
+
+/**@brief Get magic value from extent header.
+ * @param header Extent header to load value from
+ * @return Magic value of extent header */
+static inline uint16_t
+ext4_extent_header_get_magic(struct ext4_extent_header *header)
+{
+ return to_le16(header->magic);
+}
+
+/**@brief Set magic value to extent header.
+ * @param header Extent header to set value to
+ * @param magic Magic value of extent header */
+static inline void ext4_extent_header_set_magic(struct ext4_extent_header *header,
+ uint16_t magic)
+{
+ header->magic = to_le16(magic);
+}
+
+/**@brief Get number of entries from extent header
+ * @param header Extent header to get value from
+ * @return Number of entries covered by extent header */
+static inline uint16_t
+ext4_extent_header_get_nentries(struct ext4_extent_header *header)
+{
+ return to_le16(header->nentries);
+}
+
+/**@brief Set number of entries to extent header
+ * @param header Extent header to set value to
+ * @param count Number of entries covered by extent header */
+static inline void
+ext4_extent_header_set_nentries(struct ext4_extent_header *header,
+ uint16_t count)
+{
+ header->nentries = to_le16(count);
+}
+
+/**@brief Get maximum number of entries from extent header
+ * @param header Extent header to get value from
+ * @return Maximum number of entries covered by extent header */
+static inline uint16_t
+ext4_extent_header_get_max_nentries(struct ext4_extent_header *header)
+{
+ return to_le16(header->max_nentries);
+}
+
+/**@brief Set maximum number of entries to extent header
+ * @param header Extent header to set value to
+ * @param max_count Maximum number of entries covered by extent header */
+static inline void
+ext4_extent_header_set_max_nentries(struct ext4_extent_header *header,
+ uint16_t max_count)
+{
+ header->max_nentries = to_le16(max_count);
+}
+
+/**@brief Get depth of extent subtree.
+ * @param header Extent header to get value from
+ * @return Depth of extent subtree */
+static inline uint16_t
+ext4_extent_header_get_depth(struct ext4_extent_header *header)
+{
+ return to_le16(header->depth);
+}
+
+/**@brief Set depth of extent subtree.
+ * @param header Extent header to set value to
+ * @param depth Depth of extent subtree */
+static inline void
+ext4_extent_header_set_depth(struct ext4_extent_header *header,
+ uint16_t depth)
+{
+ header->depth = to_le16(depth);
+}
+
+/**@brief Get generation from extent header
+ * @param header Extent header to get value from
+ * @return Generation */
+static inline uint32_t
+ext4_extent_header_get_generation(struct ext4_extent_header *header)
+{
+ return to_le32(header->generation);
+}
+
+/**@brief Set generation to extent header
+ * @param header Extent header to set value to
+ * @param generation Generation */
+static inline void
+ext4_extent_header_set_generation(struct ext4_extent_header *header,
+ uint32_t generation)
+{
+ header->generation = to_le32(generation);
+}
+
+/******************************************************************************/
+
+/**TODO: */
+static inline void ext4_extent_tree_init(struct ext4_inode_ref *inode_ref)
+{
+ /* Initialize extent root header */
+ struct ext4_extent_header *header =
+ ext4_inode_get_extent_header(inode_ref->inode);
+ ext4_extent_header_set_depth(header, 0);
+ ext4_extent_header_set_nentries(header, 0);
+ ext4_extent_header_set_generation(header, 0);
+ ext4_extent_header_set_magic(header, EXT4_EXTENT_MAGIC);
+
+ uint16_t max_entries = (EXT4_INODE_BLOCKS * sizeof(uint32_t) -
+ sizeof(struct ext4_extent_header)) /
+ sizeof(struct ext4_extent);
+
+ ext4_extent_header_set_max_nentries(header, max_entries);
+ inode_ref->dirty = true;
+}
+
+
+
+/**@brief Extent-based blockmap manipulation
+ * @param inode_ref I-node
+ * @param iblock starting logical block of the inode
+ * @param max_nblocks maximum number of blocks to get from/allocate to blockmap
+ * @param resfblockp return physical block address of the first block of an
+ * extent
+ * @param create true if caller wants to insert mapping or convert
+ * unwritten mapping to written one
+ * @param resnblocksp return number of blocks in an extent (must be smaller than
+ * \p max_nblocks)
+ * @return Error code*/
+int ext4_extent_get_blocks(struct ext4_inode_ref *inode_ref,
+ ext4_lblk_t iblock,
+ ext4_lblk_t max_nblocks,
+ ext4_fsblk_t *resfblockp,
+ bool create,
+ ext4_lblk_t *resnblocksp);
+
+
/**@brief Release all data blocks starting from specified logical block.
* @param inode_ref I-node to release blocks from
* @param iblock_from First logical block to release
* @return Error code */
-int ext4_extent_remove_space(struct ext4_inode_ref *inode_ref, ext4_lblk_t from,
+int ext4_extent_remove_space(struct ext4_inode_ref *inode_ref,
+ ext4_lblk_t from,
ext4_lblk_t to);
--- a/include/ext4_types.h
+++ b/include/ext4_types.h
@@ -617,9 +617,71 @@
#define EXT4_JOURNAL_INO 8
#define EXT4_GOOD_OLD_FIRST_INO 11
-#define EXT_MAX_BLOCKS (ext4_lblk_t) (-1)
-#define IN_RANGE(b, first, len) ((b) >= (first) && (b) <= (first) + (len) - 1)
+#ifdef __plan9__
+#pragma pack on
+#else
+#pragma pack(push)
+#endif
+
+/*
+ * This is the extent tail on-disk structure.
+ * All other extent structures are 12 bytes long. It turns out that
+ * block size % 12 >= 4 for at least all powers of 2 greater than 512, which
+ * covers all valid ext4 block sizes. Therefore, this tail structure can be
+ * crammed into the end of the block without having to rebalance the tree.
+ */
+struct ext4_extent_tail
+{
+ uint32_t checksum; /* crc32c(uuid+inum+extent_block) */
+};
+
+/*
+ * This is the extent on-disk structure.
+ * It's used at the bottom of the tree.
+ */
+struct ext4_extent {
+ uint32_t iblock; /* First logical block extent covers */
+ uint16_t nblocks; /* Number of blocks covered by extent */
+ uint16_t fblock_hi; /* High 16 bits of physical block */
+ uint32_t fblock_lo; /* Low 32 bits of physical block */
+};
+
+/*
+ * This is index on-disk structure.
+ * It's used at all the levels except the bottom.
+ */
+struct ext4_extent_index {
+ uint32_t iblock; /* Index covers logical blocks from 'block' */
+
+ /**
+ * Pointer to the physical block of the next
+ * level. leaf or next index could be there
+ * high 16 bits of physical block
+ */
+ uint32_t fblock_lo;
+ uint16_t fblock_hi;
+ uint16_t padding;
+};
+
+/*
+ * Each block (leaves and indexes), even inode-stored has header.
+ */
+struct ext4_extent_header {
+ uint16_t magic;
+ uint16_t nentries; /* Number of valid entries */
+ uint16_t max_nentries; /* Capacity of store in entries */
+ uint16_t depth; /* Has tree real underlying blocks? */
+ uint32_t generation; /* generation of the tree */
+};
+
+#ifdef __plan9__
+#pragma pack off
+#else
+#pragma pack(pop)
+#endif
+
+#define EXT4_EXTENT_MAGIC 0xF30A
/******************************************************************************/
--- a/src/ext4_extent.c
+++ b/src/ext4_extent.c
@@ -1,2150 +1,2294 @@
/*
- * Copyright (c) 2017 Grzegorz Kostka (kostka.grzegorz@gmail.com)
* Copyright (c) 2017 Kaho Ng (ngkaho1234@gmail.com)
+ * Copyright (c) 2017 Grzegorz Kostka (kostka.grzegorz@gmail.com)
*
- * This program is free software; you can redistribute it and/or
- * modify it under the terms of the GNU General Public License
- * as published by the Free Software Foundation; either version 2
- * of the License, or (at your option) any later version.
+ *
+ * HelenOS:
+ * Copyright (c) 2012 Martin Sucha
+ * Copyright (c) 2012 Frantisek Princ
+ * All rights reserved.
+ *
+ * Redistribution and use in source and binary forms, with or without
+ * modification, are permitted provided that the following conditions
+ * are met:
+ *
+ * - Redistributions of source code must retain the above copyright
+ * notice, this list of conditions and the following disclaimer.
+ * - Redistributions in binary form must reproduce the above copyright
+ * notice, this list of conditions and the following disclaimer in the
+ * documentation and/or other materials provided with the distribution.
+ * - The name of the author may not be used to endorse or promote products
+ * derived from this software without specific prior written permission.
+ *
+ * THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR
+ * IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES
+ * OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
+ * IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, INDIRECT,
+ * INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT
+ * NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
+ * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
+ * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
+ * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF
+ * THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
-#include <ext4.h>
+/** @addtogroup lwext4
+ * @{
+ */
+/**
+ * @file ext4_extent.c
+ * @brief More complex filesystem functions.
+ */
-#include <ext4_blockdev.h>
-#include <ext4_trans.h>
+#include <ext4_config.h>
+#include <ext4_errno.h>
+#include <ext4_debug.h>
+
#include <ext4_fs.h>
+#include <ext4_trans.h>
+#include <ext4_blockdev.h>
+#include <ext4_extent.h>
+#include <ext4_inode.h>
#include <ext4_super.h>
#include <ext4_crc32.h>
#include <ext4_balloc.h>
-#include <ext4_extent.h>
-#include <stdlib.h>
#include <string.h>
-#include <inttypes.h>
-#include <stddef.h>
+#include <stdlib.h>
-#if CONFIG_EXTENTS_ENABLE
-/*
- * used by extent splitting.
- */
-#define EXT4_EXT_MARK_UNWRIT1 0x02 /* mark first half unwritten */
-#define EXT4_EXT_MARK_UNWRIT2 0x04 /* mark second half unwritten */
-#define EXT4_EXT_DATA_VALID1 0x08 /* first half contains valid data */
-#define EXT4_EXT_DATA_VALID2 0x10 /* second half contains valid data */
-#define EXT4_EXT_NO_COMBINE 0x20 /* do not combine two extents */
+#if CONFIG_EXTENT_ENABLE
-#define EXT4_EXT_UNWRITTEN_MASK (1L << 15)
+/**@brief Return the extent tree depth
+ * @param inode_ref I-node reference the tree belongs to
+ * @return Depth of extent tree */
+static inline uint16_t
+ext4_extent_tree_depth(struct ext4_inode_ref *inode_ref)
+{
+ struct ext4_extent_header *eh;
+ eh = ext4_inode_get_extent_header(inode_ref->inode);
+ return ext4_extent_header_get_depth(eh);
+}
-#define EXT4_EXT_MAX_LEN_WRITTEN (1L << 15)
-#define EXT4_EXT_MAX_LEN_UNWRITTEN \
- (EXT4_EXT_MAX_LEN_WRITTEN - 1)
+static struct ext4_extent_tail *
+ext4_extent_get_csum_tail(struct ext4_extent_header *eh)
+{
+ return (struct ext4_extent_tail *)(((char *)eh) +
+ EXT4_EXTENT_TAIL_OFFSET(eh));
+}
-#define EXT4_EXT_GET_LEN(ex) to_le16((ex)->block_count)
-#define EXT4_EXT_GET_LEN_UNWRITTEN(ex) \
- (EXT4_EXT_GET_LEN(ex) & ~(EXT4_EXT_UNWRITTEN_MASK))
-#define EXT4_EXT_SET_LEN(ex, count) \
- ((ex)->block_count = to_le16(count))
+#if CONFIG_META_CSUM_ENABLE
+static uint32_t ext4_extent_block_csum(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_header *eh)
+{
+ uint32_t checksum = 0;
+ struct ext4_sblock *sb = &inode_ref->fs->sb;
-#define EXT4_EXT_IS_UNWRITTEN(ex) \
- (EXT4_EXT_GET_LEN(ex) > EXT4_EXT_MAX_LEN_WRITTEN)
-#define EXT4_EXT_SET_UNWRITTEN(ex) \
- ((ex)->block_count |= to_le16(EXT4_EXT_UNWRITTEN_MASK))
-#define EXT4_EXT_SET_WRITTEN(ex) \
- ((ex)->block_count &= ~(to_le16(EXT4_EXT_UNWRITTEN_MASK)))
+ if (ext4_sb_feature_ro_com(sb, EXT4_FRO_COM_METADATA_CSUM)) {
+ uint32_t ino_index = to_le32(inode_ref->index);
+ uint32_t ino_gen =
+ to_le32(ext4_inode_get_generation(inode_ref->inode));
+ /* First calculate crc32 checksum against fs uuid */
+ checksum = ext4_crc32c(EXT4_CRC32_INIT, sb->uuid,
+ sizeof(sb->uuid));
+ /* Then calculate crc32 checksum against inode number
+ * and inode generation */
+ checksum = ext4_crc32c(checksum, &ino_index,
+ sizeof(ino_index));
+ checksum = ext4_crc32c(checksum, &ino_gen,
+ sizeof(ino_gen));
+ /* Finally calculate crc32 checksum against
+ * the entire extent block up to the checksum field */
+ checksum = ext4_crc32c(checksum, eh,
+ EXT4_EXTENT_TAIL_OFFSET(eh));
+ }
+ return checksum;
+}
-/*
- * Array of ext4_ext_path contains path to some extent.
- * Creation/lookup routines use it for traversal/splitting/etc.
- * Truncate uses it to simulate recursive walking.
- */
-struct ext4_extent_path {
- ext4_fsblk_t p_block;
- struct ext4_block block;
- int32_t depth;
- int32_t maxdepth;
- struct ext4_extent_header *header;
- struct ext4_extent_index *index;
- struct ext4_extent *extent;
-};
+static bool
+ext4_extent_verify_block_csum(struct ext4_inode_ref *inode_ref,
+ struct ext4_block *block)
+{
+ uint16_t rootdepth;
+ struct ext4_extent_tail *tail;
+ struct ext4_extent_header *eh;
-#ifdef __plan9__
-#pragma pack on
-#else
-#pragma pack(push, 1)
-#endif
+ rootdepth = ext4_extent_tree_depth(inode_ref);
-/*
- * This is the extent tail on-disk structure.
- * All other extent structures are 12 bytes long. It turns out that
- * block_size % 12 >= 4 for at least all powers of 2 greater than 512, which
- * covers all valid ext4 block sizes. Therefore, this tail structure can be
- * crammed into the end of the block without having to rebalance the tree.
- */
-struct ext4_extent_tail
-{
- uint32_t et_checksum; /* crc32c(uuid+inum+extent_block) */
-};
+ if (!ext4_sb_feature_ro_com(&inode_ref->fs->sb,
+ EXT4_FRO_COM_METADATA_CSUM))
+ return true;
-/*
- * This is the extent on-disk structure.
- * It's used at the bottom of the tree.
- */
-struct ext4_extent {
- uint32_t first_block; /* First logical block extent covers */
- uint16_t block_count; /* Number of blocks covered by extent */
- uint16_t start_hi; /* High 16 bits of physical block */
- uint32_t start_lo; /* Low 32 bits of physical block */
-};
+ eh = (struct ext4_extent_header *)block->data;
+ if (ext4_extent_header_get_depth(eh) < rootdepth) {
+ tail = ext4_extent_get_csum_tail(eh);
+ return tail->checksum ==
+ to_le32(ext4_extent_block_csum(inode_ref, eh));
+ }
-/*
- * This is index on-disk structure.
- * It's used at all the levels except the bottom.
- */
-struct ext4_extent_index {
- uint32_t first_block; /* Index covers logical blocks from 'block' */
+ return true;
+}
+#else /* CONFIG_META_CSUM_ENABLE */
+#define ext4_ext_block_csum(...) 0
+#define ext4_extent_verify_block_csum(...) true
+#endif /* CONFIG_META_CSUM_ENABLE */
- /**
- * Pointer to the physical block of the next
- * level. leaf or next index could be there
- * high 16 bits of physical block
- */
- uint32_t leaf_lo;
- uint16_t leaf_hi;
- uint16_t padding;
-};
+static void
+ext4_extent_block_csum_set(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_header *eh)
+{
+ uint16_t rootdepth;
+ struct ext4_extent_tail *tail;
-/*
- * Each block (leaves and indexes), even inode-stored has header.
- */
-struct ext4_extent_header {
- uint16_t magic;
- uint16_t entries_count; /* Number of valid entries */
- uint16_t max_entries_count; /* Capacity of store in entries */
- uint16_t depth; /* Has tree real underlying blocks? */
- uint32_t generation; /* generation of the tree */
-};
+ rootdepth = ext4_extent_tree_depth(inode_ref);
-#ifdef __plan9__
-#pragma pack off
-#else
-#pragma pack(pop)
-#endif
+ if (!ext4_sb_feature_ro_com(&inode_ref->fs->sb,
+ EXT4_FRO_COM_METADATA_CSUM))
+ return;
-#define EXT4_EXTENT_MAGIC 0xF30A
+ if (ext4_extent_header_get_depth(eh) < rootdepth) {
+ tail = ext4_extent_get_csum_tail(eh);
+ tail->checksum = to_le32(ext4_extent_block_csum(inode_ref, eh));
+ }
+}
-#define EXT4_EXTENT_FIRST(header) \
- ((struct ext4_extent *)(((char *)(header)) + \
- sizeof(struct ext4_extent_header)))
+#if CONFIG_EXTENT_DEBUG_VERBOSE
+static void
+ext4_extent_print_path(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path)
+{
+ uint16_t rootdepth;
+ struct ext4_extent_path *p;
-#define EXT4_EXTENT_FIRST_INDEX(header) \
- ((struct ext4_extent_index *)(((char *)(header)) + \
- sizeof(struct ext4_extent_header)))
+ rootdepth = ext4_extent_tree_depth(inode_ref);
+ p = path + rootdepth;
-/*
- * EXT_INIT_MAX_LEN is the maximum number of blocks we can have in an
- * initialized extent. This is 2^15 and not (2^16 - 1), since we use the
- * MSB of ee_len field in the extent datastructure to signify if this
- * particular extent is an initialized extent or an uninitialized (i.e.
- * preallocated).
- * EXT_UNINIT_MAX_LEN is the maximum number of blocks we can have in an
- * uninitialized extent.
- * If ee_len is <= 0x8000, it is an initialized extent. Otherwise, it is an
- * uninitialized one. In other words, if MSB of ee_len is set, it is an
- * uninitialized extent with only one special scenario when ee_len = 0x8000.
- * In this case we can not have an uninitialized extent of zero length and
- * thus we make it as a special case of initialized extent with 0x8000 length.
- * This way we get better extent-to-group alignment for initialized extents.
- * Hence, the maximum number of blocks we can have in an *initialized*
- * extent is 2^15 (32768) and in an *uninitialized* extent is 2^15-1 (32767).
- */
-#define EXT_INIT_MAX_LEN (1L << 15)
-#define EXT_UNWRITTEN_MAX_LEN (EXT_INIT_MAX_LEN - 1)
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Path address: %p\n", path);
+ while (p >= path) {
+ uint16_t i;
+ uint16_t entries =
+ ext4_extent_header_get_nentries(p->header);
+ uint16_t limit =
+ ext4_extent_header_get_max_nentries(p->header);
-#define EXT_EXTENT_SIZE sizeof(struct ext4_extent)
-#define EXT_INDEX_SIZE sizeof(struct ext4_extent_idx)
+ ext4_dbg(DEBUG_EXTENT,
+DBG_INFO "-- Block: %" PRIu64 ", Depth: %" PRIu16 ", Entries: %" PRIu16 ", Limit: %" PRIu16 "\n",
+ p->block.lb_id, p->depth, entries, limit);
+ for (i = 0; i < entries; i++) {
+ if (p->depth) {
+ struct ext4_extent_index *index;
-#define EXT_FIRST_EXTENT(__hdr__) \
- ((struct ext4_extent *)(((char *)(__hdr__)) + \
- sizeof(struct ext4_extent_header)))
-#define EXT_FIRST_INDEX(__hdr__) \
- ((struct ext4_extent_index *)(((char *)(__hdr__)) + \
- sizeof(struct ext4_extent_header)))
-#define EXT_HAS_FREE_INDEX(__path__) \
- (to_le16((__path__)->header->entries_count) < \
- to_le16((__path__)->header->max_entries_count))
-#define EXT_LAST_EXTENT(__hdr__) \
- (EXT_FIRST_EXTENT((__hdr__)) + to_le16((__hdr__)->entries_count) - 1)
-#define EXT_LAST_INDEX(__hdr__) \
- (EXT_FIRST_INDEX((__hdr__)) + to_le16((__hdr__)->entries_count) - 1)
-#define EXT_MAX_EXTENT(__hdr__) \
- (EXT_FIRST_EXTENT((__hdr__)) + to_le16((__hdr__)->max_entries_count) - 1)
-#define EXT_MAX_INDEX(__hdr__) \
- (EXT_FIRST_INDEX((__hdr__)) + to_le16((__hdr__)->max_entries_count) - 1)
+ index = EXT4_EXTENT_FIRST_INDEX(p->header) + i;
+ ext4_dbg(DEBUG_EXTENT,
+DBG_INFO "Index: iblock: %" PRIu32 ", fsblock: %" PRIu64 "\n",
+ ext4_extent_index_get_iblock(index),
+ ext4_extent_index_get_fblock(index));
+ } else {
+ struct ext4_extent *extent;
-#define EXT4_EXTENT_TAIL_OFFSET(hdr) \
- (sizeof(struct ext4_extent_header) + \
- (sizeof(struct ext4_extent) * to_le16((hdr)->max_entries_count)))
+ extent = EXT4_EXTENT_FIRST(p->header) + i;
+ ext4_dbg(DEBUG_EXTENT,
+DBG_INFO "Extent: iblock: %" PRIu32 ", fsblock: %" PRIu64 ", count: %" PRIu16 "\n",
+ ext4_extent_get_iblock(extent),
+ ext4_extent_get_fblock(extent),
+ ext4_extent_get_nblocks(extent));
+ }
+ }
+ p--;
+ }
-/**@brief Get logical number of the block covered by extent.
- * @param extent Extent to load number from
- * @return Logical number of the first block covered by extent */
-static inline uint32_t ext4_extent_get_first_block(struct ext4_extent *extent)
-{
- return to_le32(extent->first_block);
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "====================\n");
}
+#else /* CONFIG_EXTENT_DEBUG_VERBOSE */
+#define ext4_extent_print_path(...)
+#endif /* CONFIG_EXTENT_DEBUG_VERBOSE */
-/**@brief Set logical number of the first block covered by extent.
- * @param extent Extent to set number to
- * @param iblock Logical number of the first block covered by extent */
-static inline void ext4_extent_set_first_block(struct ext4_extent *extent,
- uint32_t iblock)
+/**@brief Binary search in extent index node.
+ * @param header Extent header of index node
+ * @param index Output value - found index will be set here
+ * @param iblock Logical block number to find in index node */
+static void ext4_extent_binsearch_idx(struct ext4_extent_header *header,
+ struct ext4_extent_index **index,
+ ext4_lblk_t iblock)
{
- extent->first_block = to_le32(iblock);
-}
+ struct ext4_extent_index *r;
+ struct ext4_extent_index *l;
+ struct ext4_extent_index *m;
-/**@brief Get number of blocks covered by extent.
- * @param extent Extent to load count from
- * @return Number of blocks covered by extent */
-static inline uint16_t ext4_extent_get_block_count(struct ext4_extent *extent)
-{
- if (EXT4_EXT_IS_UNWRITTEN(extent))
- return EXT4_EXT_GET_LEN_UNWRITTEN(extent);
- else
- return EXT4_EXT_GET_LEN(extent);
+ uint16_t nentries = ext4_extent_header_get_nentries(header);
+
+ /* Initialize bounds */
+ l = EXT4_EXTENT_FIRST_INDEX(header) + 1;
+ r = EXT4_EXTENT_FIRST_INDEX(header) + nentries - 1;
+
+ /* Do binary search */
+ while (l <= r) {
+ m = l + (r - l) / 2;
+ ext4_lblk_t eiiblock = ext4_extent_index_get_iblock(m);
+
+ if (iblock < eiiblock)
+ r = m - 1;
+ else
+ l = m + 1;
+ }
+
+ /* Set output value */
+ *index = l - 1;
}
-/**@brief Set number of blocks covered by extent.
- * @param extent Extent to load count from
- * @param count Number of blocks covered by extent
- * @param unwritten Whether the extent is unwritten or not */
-static inline void ext4_extent_set_block_count(struct ext4_extent *extent,
- uint16_t count, bool unwritten)
-{
- EXT4_EXT_SET_LEN(extent, count);
- if (unwritten)
- EXT4_EXT_SET_UNWRITTEN(extent);
-}
-/**@brief Get physical number of the first block covered by extent.
- * @param extent Extent to load number
- * @return Physical number of the first block covered by extent */
-static inline uint64_t ext4_extent_get_start(struct ext4_extent *extent)
+/**@brief Binary search in extent leaf node.
+ * @param header Extent header of leaf node
+ * @param extent Output value - found extent will be set here,
+ * or NULL if node is empty
+ * @param iblock Logical block number to find in leaf node */
+static void ext4_extent_binsearch(struct ext4_extent_header *header,
+ struct ext4_extent **extent,
+ ext4_lblk_t iblock)
{
- return ((uint64_t)to_le16(extent->start_hi)) << 32 |
- ((uint64_t)to_le32(extent->start_lo));
-}
+ struct ext4_extent *r;
+ struct ext4_extent *l;
+ struct ext4_extent *m;
+ uint16_t nentries = ext4_extent_header_get_nentries(header);
-/**@brief Set physical number of the first block covered by extent.
- * @param extent Extent to load number
- * @param fblock Physical number of the first block covered by extent */
-static inline void ext4_extent_set_start(struct ext4_extent *extent, uint64_t fblock)
-{
- extent->start_lo = to_le32((fblock << 32) >> 32);
- extent->start_hi = to_le16((uint16_t)(fblock >> 32));
-}
+ if (nentries == 0) {
+ /* this leaf is empty */
+ *extent = NULL;
+ return;
+ }
+ /* Initialize bounds */
+ l = EXT4_EXTENT_FIRST(header) + 1;
+ r = EXT4_EXTENT_FIRST(header) + nentries - 1;
-/**@brief Get logical number of the block covered by extent index.
- * @param index Extent index to load number from
- * @return Logical number of the first block covered by extent index */
-static inline uint32_t
-ext4_extent_index_get_first_block(struct ext4_extent_index *index)
-{
- return to_le32(index->first_block);
-}
+ /* Do binary search */
+ while (l <= r) {
+ m = l + (r - l) / 2;
+ ext4_lblk_t eiblock = ext4_extent_get_iblock(m);
-/**@brief Set logical number of the block covered by extent index.
- * @param index Extent index to set number to
- * @param iblock Logical number of the first block covered by extent index */
-static inline void
-ext4_extent_index_set_first_block(struct ext4_extent_index *index,
- uint32_t iblock)
-{
- index->first_block = to_le32(iblock);
-}
+ if (iblock < eiblock)
+ r = m - 1;
+ else
+ l = m + 1;
+ }
-/**@brief Get physical number of block where the child node is located.
- * @param index Extent index to load number from
- * @return Physical number of the block with child node */
-static inline uint64_t
-ext4_extent_index_get_leaf(struct ext4_extent_index *index)
-{
- return ((uint64_t)to_le16(index->leaf_hi)) << 32 |
- ((uint64_t)to_le32(index->leaf_lo));
+ /* Set output value */
+ *extent = l - 1;
}
-/**@brief Set physical number of block where the child node is located.
- * @param index Extent index to set number to
- * @param fblock Ohysical number of the block with child node */
-static inline void ext4_extent_index_set_leaf(struct ext4_extent_index *index,
- uint64_t fblock)
+static void
+ext4_extent_path_dirty(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ uint16_t depth)
{
- index->leaf_lo = to_le32((fblock << 32) >> 32);
- index->leaf_hi = to_le16((uint16_t)(fblock >> 32));
-}
+ uint16_t rootdepth;
+ rootdepth = ext4_extent_tree_depth(inode_ref);
-/**@brief Get magic value from extent header.
- * @param header Extent header to load value from
- * @return Magic value of extent header */
-static inline uint16_t
-ext4_extent_header_get_magic(struct ext4_extent_header *header)
-{
- return to_le16(header->magic);
+ if (rootdepth != depth) {
+ struct ext4_extent_path *p;
+ p = path + depth;
+ ext4_extent_block_csum_set(inode_ref, p->header);
+ ext4_trans_set_block_dirty(p->block.buf);
+ } else
+ inode_ref->dirty = true;
}
-/**@brief Set magic value to extent header.
- * @param header Extent header to set value to
- * @param magic Magic value of extent header */
-static inline void ext4_extent_header_set_magic(struct ext4_extent_header *header,
- uint16_t magic)
+static int
+ext4_extent_path_release(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path)
{
- header->magic = to_le16(magic);
-}
+ int ret = EOK;
+ uint16_t i, rootdepth;
-/**@brief Get number of entries from extent header
- * @param header Extent header to get value from
- * @return Number of entries covered by extent header */
-static inline uint16_t
-ext4_extent_header_get_entries_count(struct ext4_extent_header *header)
-{
- return to_le16(header->entries_count);
-}
+ rootdepth = ext4_extent_tree_depth(inode_ref);
-/**@brief Set number of entries to extent header
- * @param header Extent header to set value to
- * @param count Number of entries covered by extent header */
-static inline void
-ext4_extent_header_set_entries_count(struct ext4_extent_header *header,
- uint16_t count)
-{
- header->entries_count = to_le16(count);
-}
+ for (i = 0; i < rootdepth; i++) {
+ if (path[i].block.lb_id) {
+ ret = ext4_block_set(inode_ref->fs->bdev,
+ &path[i].block);
+ if (ret != EOK)
+ break;
+ }
+ }
-/**@brief Get maximum number of entries from extent header
- * @param header Extent header to get value from
- * @return Maximum number of entries covered by extent header */
-static inline uint16_t
-ext4_extent_header_get_max_entries_count(struct ext4_extent_header *header)
-{
- return to_le16(header->max_entries_count);
+ return ret;
}
-/**@brief Set maximum number of entries to extent header
- * @param header Extent header to set value to
- * @param max_count Maximum number of entries covered by extent header */
-static inline void
-ext4_extent_header_set_max_entries_count(struct ext4_extent_header *header,
- uint16_t max_count)
+/**@brief Physical block allocation hint for extent tree manipulation
+ * routines
+ * @param inode_ref I-node
+ * @return Physical block allocation hint */
+static ext4_fsblk_t
+ext4_extent_tree_alloc_goal(struct ext4_inode_ref *inode_ref)
{
- header->max_entries_count = to_le16(max_count);
-}
+ uint32_t bgid;
+ struct ext4_sblock *sb;
-/**@brief Get depth of extent subtree.
- * @param header Extent header to get value from
- * @return Depth of extent subtree */
-static inline uint16_t
-ext4_extent_header_get_depth(struct ext4_extent_header *header)
-{
- return to_le16(header->depth);
-}
+ sb = &inode_ref->fs->sb;
+ bgid = inode_ref->index / ext4_get32(sb, inodes_per_group);
-/**@brief Set depth of extent subtree.
- * @param header Extent header to set value to
- * @param depth Depth of extent subtree */
-static inline void
-ext4_extent_header_set_depth(struct ext4_extent_header *header, uint16_t depth)
-{
- header->depth = to_le16(depth);
+ /* Currently for allocations from extent tree manipulation routines,
+ * we try the blocks in the block group the inode table block refers
+ * to */
+ return ext4_fs_first_bg_block_no(sb, bgid);
}
-/**@brief Get generation from extent header
- * @param header Extent header to get value from
- * @return Generation */
-static inline uint32_t
-ext4_extent_header_get_generation(struct ext4_extent_header *header)
+/**@brief Physical block allocation hint for data blocks routines
+ * @param inode_ref I-node
+ * @param path path in the extent tree
+ * @param iblock the starting logical block of the
+ * mapping to be inserted
+ * @return Physical block allocation hint */
+static ext4_fsblk_t
+ext4_extent_data_alloc_goal(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ ext4_lblk_t iblock)
{
- return to_le32(header->generation);
-}
+ ext4_fsblk_t ret;
+ struct ext4_extent *ext;
-/**@brief Set generation to extent header
- * @param header Extent header to set value to
- * @param generation Generation */
-static inline void
-ext4_extent_header_set_generation(struct ext4_extent_header *header,
- uint32_t generation)
-{
- header->generation = to_le32(generation);
+ ext = path[0].extent;
+ if (!ext)
+ /* If there is no mapping yet, we return
+ * ext4_extent_tree_alloc_goal() as hints */
+ return ext4_extent_tree_alloc_goal(inode_ref) + iblock;
+
+ /* We want the whole file to be continuous. */
+ if (ext4_extent_get_iblock(ext) < iblock)
+ ret = ext4_extent_get_fblock(ext) +
+ iblock - ext4_extent_get_iblock(ext);
+ else {
+ if (ext4_extent_get_iblock(ext) - iblock >
+ ext4_extent_get_fblock(ext))
+ ret = ext4_extent_get_fblock(ext);
+ else
+ ret = ext4_extent_get_fblock(ext) -
+ (ext4_extent_get_iblock(ext) - iblock);
+ }
+
+ return ret;
}
-void ext4_extent_tree_init(struct ext4_inode_ref *inode_ref)
+/**@brief Verify the extent node block is valid
+ * @param inode_ref I-node
+ * @param block block buffer of the extent node block
+ * @param depth the depth of extent node wanted
+ * @return true if the block passes verification, otherwise false
+ */
+static bool ext4_extent_block_verify(struct ext4_inode_ref *inode_ref,
+ struct ext4_block *block,
+ uint16_t depth)
{
- /* Initialize extent root header */
- struct ext4_extent_header *header =
- ext4_inode_get_extent_header(inode_ref->inode);
- ext4_extent_header_set_depth(header, 0);
- ext4_extent_header_set_entries_count(header, 0);
- ext4_extent_header_set_generation(header, 0);
- ext4_extent_header_set_magic(header, EXT4_EXTENT_MAGIC);
+ uint32_t blocksz;
+ uint16_t maxnentries __unused;
+ struct ext4_extent_header *eh;
- uint16_t max_entries = (EXT4_INODE_BLOCKS * sizeof(uint32_t) -
- sizeof(struct ext4_extent_header)) /
- sizeof(struct ext4_extent);
+ eh = (struct ext4_extent_header *)block->data;
+ blocksz = ext4_sb_get_block_size(&inode_ref->fs->sb);
- ext4_extent_header_set_max_entries_count(header, max_entries);
- inode_ref->dirty = true;
-}
+ /* Check if the magic number of the extent node header is correct */
+ if (ext4_extent_header_get_magic(eh) != EXT4_EXTENT_MAGIC) {
+ ext4_dbg(DEBUG_EXTENT,
+DBG_ERROR "Extent node block header mismatch! Block number: %" PRIu64 "\n",
+ block->lb_id);
+ return false;
+ }
+ /* Check if the depth field of extent node header matches what the
+ * caller wants */
+ if (ext4_extent_header_get_depth(eh) != depth) {
+ ext4_dbg(DEBUG_EXTENT,
+DBG_ERROR "Extent node block depth mismatch! Expected: %" PRIu16 ", Got: %" PRIu16 ". Block number: %" PRIu64 "\n",
+ depth, ext4_extent_header_get_depth(eh),
+ block->lb_id);
+ return false;
+ }
-static struct ext4_extent_tail *
-find_ext4_extent_tail(struct ext4_extent_header *eh)
-{
- return (struct ext4_extent_tail *)(((char *)eh) +
- EXT4_EXTENT_TAIL_OFFSET(eh));
-}
+ /* Check if the non-root node contains entries */
+ if (!ext4_extent_header_get_nentries(eh)) {
+ ext4_dbg(DEBUG_EXTENT,
+DBG_ERROR "Extent node block does not contain any entries! Block number: %" PRIu64 "\n",
+ block->lb_id);
+ return false;
+ }
-static struct ext4_extent_header *ext_inode_hdr(struct ext4_inode *inode)
-{
- return (struct ext4_extent_header *)inode->blocks;
-}
+#if !CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ /* Make sure that the maximum entries field of the
+ * extent node header is correct */
+ maxnentries = (blocksz - sizeof(struct ext4_extent_header)) /
+ sizeof(struct ext4_extent);
-static struct ext4_extent_header *ext_block_hdr(struct ext4_block *block)
-{
- return (struct ext4_extent_header *)block->data;
-}
+ if (ext4_extent_header_get_max_nentries(eh) != maxnentries) {
+ ext4_dbg(DEBUG_EXTENT,
+DBG_ERROR "Incorrect extent node block maximum entries field! Expected: %" PRIu16 ", Got: %" PRIu16 ". Block number: %" PRIu64 "\n",
+ maxnentries,
+ ext4_extent_header_get_max_nentries(eh),
+ block->lb_id);
+ return false;
+ }
+#endif
-static uint16_t ext_depth(struct ext4_inode *inode)
-{
- return to_le16(ext_inode_hdr(inode)->depth);
-}
+ /* Check if the checksum of the block is correct */
+ if (!ext4_extent_verify_block_csum(inode_ref,
+ block)) {
+ ext4_dbg(DEBUG_EXTENT,
+DBG_ERROR "Extent node block checksum failed! Block number: %" PRIu64"\n",
+ block->lb_id);
+ return false;
+ }
-static uint16_t ext4_ext_get_actual_len(struct ext4_extent *ext)
-{
- return (to_le16(ext->block_count) <= EXT_INIT_MAX_LEN
- ? to_le16(ext->block_count)
- : (to_le16(ext->block_count) - EXT_INIT_MAX_LEN));
+ /* The block passes verification */
+ return true;
}
-static void ext4_ext_mark_initialized(struct ext4_extent *ext)
+/**@brief Find extent for specified iblock.
+ * This function is used for finding block in the extent tree with
+ * saving the path through the tree for possible future modifications.
+ * @param inode_ref I-node to read extent tree from
+ * @param iblock Iblock to find extent for
+ * @param ppath Output value - loaded path from extent tree
+ * @return Error code */
+static int ext4_extent_find_extent(struct ext4_inode_ref *inode_ref,
+ ext4_lblk_t iblock,
+ struct ext4_extent_path **ppath)
{
- ext->block_count = to_le16(ext4_ext_get_actual_len(ext));
-}
+ struct ext4_extent_header *eh;
+ int ret;
+ uint16_t depth;
+ uint16_t k;
+ struct ext4_extent_path *tpath;
-static void ext4_ext_mark_unwritten(struct ext4_extent *ext)
-{
- ext->block_count |= to_le16(EXT_INIT_MAX_LEN);
-}
+ depth = ext4_extent_tree_depth(inode_ref);
+ eh = ext4_inode_get_extent_header(inode_ref->inode);
-static int ext4_ext_is_unwritten(struct ext4_extent *ext)
-{
- /* Extent with ee_len of 0x8000 is treated as an initialized extent */
- return (to_le16(ext->block_count) > EXT_INIT_MAX_LEN);
-}
+ /* Added 2 for possible tree growing (1 extra depth) */
+ tpath = ext4_malloc(sizeof(struct ext4_extent_path) * (depth + 2));
+ if (tpath == NULL)
+ return ENOMEM;
-/*
- * ext4_ext_pblock:
- * combine low and high parts of physical block number into ext4_fsblk_t
- */
-static ext4_fsblk_t ext4_ext_pblock(struct ext4_extent *ex)
-{
- ext4_fsblk_t block;
+ /* Zero the path array because we need to make sure that
+ * lb_id field of block buffer is zero */
+ memset(tpath, 0, sizeof(struct ext4_extent_path) * (depth + 2));
- block = to_le32(ex->start_lo);
- block |= ((ext4_fsblk_t)to_le16(ex->start_hi) << 31) << 1;
- return block;
-}
+ /* Initialize structure for algorithm start */
+ k = depth;
+ tpath[k].block = inode_ref->block;
+ tpath[k].header = eh;
-/*
- * ext4_idx_pblock:
- * combine low and high parts of a leaf physical block number into ext4_fsblk_t
- */
-static ext4_fsblk_t ext4_idx_pblock(struct ext4_extent_index *ix)
-{
- ext4_fsblk_t block;
+ /* Walk through the extent tree */
+ while ((depth = ext4_extent_header_get_depth(eh)) != 0) {
+ /* Search index in index node by iblock */
+ ext4_extent_binsearch_idx(tpath[k].header,
+ &tpath[k].index, iblock);
- block = to_le32(ix->leaf_lo);
- block |= ((ext4_fsblk_t)to_le16(ix->leaf_hi) << 31) << 1;
- return block;
-}
+ tpath[k].depth = depth;
+ tpath[k].extent = NULL;
-/*
- * ext4_ext_store_pblock:
- * stores a large physical block number into an extent struct,
- * breaking it into parts
- */
-static void ext4_ext_store_pblock(struct ext4_extent *ex, ext4_fsblk_t pb)
-{
- ex->start_lo = to_le32((uint32_t)(pb & 0xffffffff));
- ex->start_hi = to_le16((uint16_t)((pb >> 32)) & 0xffff);
-}
+ ext4_assert(tpath[k].index != 0);
-/*
- * ext4_idx_store_pblock:
- * stores a large physical block number into an index struct,
- * breaking it into parts
- */
-static void ext4_idx_store_pblock(struct ext4_extent_index *ix, ext4_fsblk_t pb)
-{
- ix->leaf_lo = to_le32((uint32_t)(pb & 0xffffffff));
- ix->leaf_hi = to_le16((uint16_t)((pb >> 32)) & 0xffff);
-}
+ /* Load information for the next iteration */
+ uint64_t fblock =
+ ext4_extent_index_get_fblock(tpath[k].index);
-static int ext4_allocate_single_block(struct ext4_inode_ref *inode_ref,
- ext4_fsblk_t goal, ext4_fsblk_t *blockp)
-{
- return ext4_balloc_alloc_block(inode_ref, goal, blockp);
-}
+ struct ext4_block block;
+ ret = ext4_trans_block_get(inode_ref->fs->bdev, &block, fblock);
+ if (ret != EOK)
+ goto errout0;
-static ext4_fsblk_t ext4_new_meta_blocks(struct ext4_inode_ref *inode_ref,
- ext4_fsblk_t goal,
- uint32_t flags __unused,
- uint32_t *count, int *errp)
-{
- ext4_fsblk_t block = 0;
+ if (!ext4_extent_block_verify(inode_ref, &block, depth - 1)) {
+ ret = EIO;
+ goto errout0;
+ }
- USED(flags);
+ k--;
- *errp = ext4_allocate_single_block(inode_ref, goal, &block);
- if (count)
- *count = 1;
- return block;
-}
+ eh = (struct ext4_extent_header *)block.data;
+ tpath[k].block = block;
+ tpath[k].header = eh;
+ }
-static void ext4_ext_free_blocks(struct ext4_inode_ref *inode_ref,
- ext4_fsblk_t block, uint32_t count,
- uint32_t flags __unused)
-{
- USED(flags);
- ext4_balloc_free_blocks(inode_ref, block, count);
-}
+ tpath[k].depth = 0;
+ tpath[k].extent = NULL;
+ tpath[k].index = NULL;
-static uint16_t ext4_ext_space_block(struct ext4_inode_ref *inode_ref)
-{
- uint16_t size;
- uint32_t block_size = ext4_sb_get_block_size(&inode_ref->fs->sb);
+ /* Find extent in the leaf node */
+ ext4_extent_binsearch(tpath[k].header, &tpath[k].extent,
+ iblock);
+ *ppath = tpath;
- size = (block_size - sizeof(struct ext4_extent_header)) /
- sizeof(struct ext4_extent);
-#ifdef AGGRESSIVE_TEST
- if (size > 6)
- size = 6;
-#endif
- return size;
-}
+ return EOK;
-static uint16_t ext4_ext_space_block_idx(struct ext4_inode_ref *inode_ref)
-{
- uint16_t size;
- uint32_t block_size = ext4_sb_get_block_size(&inode_ref->fs->sb);
+errout0:
+ /* Put loaded blocks */
+ ext4_extent_path_release(inode_ref, tpath);
- size = (block_size - sizeof(struct ext4_extent_header)) /
- sizeof(struct ext4_extent_index);
-#ifdef AGGRESSIVE_TEST
- if (size > 5)
- size = 5;
-#endif
- return size;
+ /* Destroy temporary data structure */
+ ext4_free(tpath);
+
+ return ret;
}
-static uint16_t ext4_ext_space_root(struct ext4_inode_ref *inode_ref)
+/**@brief Reload the paths in a cursor starting from the level having invalid
+ * pointer
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree
+ * @param depth The level to start the reload at
+ * @param right Try to load the rightmost children
+ * @return EOK on success, EIO on corrupted block, or return values of
+ * ext4_trans_block_get(). */
+int ext4_extent_reload_paths(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ uint16_t depth,
+ bool right)
{
- uint16_t size;
+ int ret = EOK;
+ struct ext4_extent_header *header;
+ struct ext4_extent_path *p;
- USED(inode_ref);
- size = sizeof(inode_ref->inode->blocks);
- size -= sizeof(struct ext4_extent_header);
- size /= sizeof(struct ext4_extent);
-#ifdef AGGRESSIVE_TEST
- if (size > 3)
- size = 3;
-#endif
- return size;
-}
+ /* actually we assume our caller starting from index level instead of
+ * extent level */
+ ext4_assert(depth);
-static uint16_t ext4_ext_space_root_idx(struct ext4_inode_ref *inode_ref)
-{
- uint16_t size;
+ p = path + depth;
+ header = p->header;
- USED(inode_ref);
- size = sizeof(inode_ref->inode->blocks);
- size -= sizeof(struct ext4_extent_header);
- size /= sizeof(struct ext4_extent_index);
-#ifdef AGGRESSIVE_TEST
- if (size > 4)
- size = 4;
-#endif
- return size;
-}
+ /* XXX: the path becomes invalid at the first place... */
+ if (p->index > EXT4_EXTENT_LAST_INDEX(header))
+ p->index = EXT4_EXTENT_LAST_INDEX(header);
-static uint16_t ext4_ext_max_entries(struct ext4_inode_ref *inode_ref,
- uint32_t depth)
-{
- uint16_t max;
+ /* Start reloading all the paths from the child of the specified level
+ * toward the leaf */
+ for (; p > path; --p) {
+ struct ext4_extent_path *chldp;
+ struct ext4_extent_index *idx;
- if (depth == ext_depth(inode_ref->inode)) {
- if (depth == 0)
- max = ext4_ext_space_root(inode_ref);
- else
- max = ext4_ext_space_root_idx(inode_ref);
- } else {
- if (depth == 0)
- max = ext4_ext_space_block(inode_ref);
- else
- max = ext4_ext_space_block_idx(inode_ref);
- }
+ chldp = p - 1;
+ header = p->header; USED(header);
+ idx = p->index;
- return max;
+ /* Release the buffer of child path if the buffer is still
+ * valid */
+ if (chldp->block.lb_id) {
+ ret = ext4_block_set(inode_ref->fs->bdev, &chldp->block);
+ if (ret != EOK)
+ goto out;
+ }
+
+ /* Read the block specified by the physical block field of the
+ * index */
+ ret = ext4_trans_block_get(inode_ref->fs->bdev, &chldp->block,
+ ext4_extent_index_get_fblock(idx));
+ if (ret != EOK)
+ goto out;
+
+ header = (struct ext4_extent_header *)chldp->block.data;
+ /* Validate the block content before moving on. */
+ if (!ext4_extent_block_verify(inode_ref,
+ &chldp->block, p->depth - 1)) {
+ ret = EIO;
+ goto out;
+ }
+
+ /* Reset the fields of child path */
+ chldp->header = header;
+ chldp->depth = ext4_extent_header_get_depth(header);
+ if (right) {
+ if (chldp->depth) {
+ chldp->index = EXT4_EXTENT_LAST_INDEX(header);
+ chldp->extent = NULL;
+ } else {
+ chldp->extent = EXT4_EXTENT_LAST(header);
+ chldp->index = NULL;
+ }
+ } else {
+ if (chldp->depth) {
+ chldp->index = EXT4_EXTENT_FIRST_INDEX(header);
+ chldp->extent = NULL;
+ } else {
+ chldp->extent = EXT4_EXTENT_FIRST(header);
+ chldp->index = NULL;
+ }
+ }
+ }
+out:
+ return ret;
}
-static ext4_fsblk_t ext4_ext_find_goal(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path,
- ext4_lblk_t block)
+/**@brief Seek to the next extent
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree
+ * @param nonextp Output value - whether the current extent is the
+ * right-most extent already
+ * @return 0 on success, EIO on currupted block, or return values of
+ * ext4_trans_block_get(). */
+int ext4_extent_increment(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ bool *nonextp)
{
- if (path) {
- uint32_t depth = path->depth;
- struct ext4_extent *ex;
+ int ret = EOK;
+ uint16_t ptr;
+ bool nonext = true;
+ uint16_t depth = 0;
+ struct ext4_extent_path *p;
+ uint16_t rootdepth;
- /*
- * Try to predict block placement assuming that we are
- * filling in a file which will eventually be
- * non-sparse --- i.e., in the case of libbfd writing
- * an ELF object sections out-of-order but in a way
- * the eventually results in a contiguous object or
- * executable file, or some database extending a table
- * space file. However, this is actually somewhat
- * non-ideal if we are writing a sparse file such as
- * qemu or KVM writing a raw image file that is going
- * to stay fairly sparse, since it will end up
- * fragmenting the file system's free space. Maybe we
- * should have some hueristics or some way to allow
- * userspace to pass a hint to file system,
- * especially if the latter case turns out to be
- * common.
- */
- ex = path[depth].extent;
- if (ex) {
- ext4_fsblk_t ext_pblk = ext4_ext_pblock(ex);
- ext4_lblk_t ext_block = to_le32(ex->first_block);
+ p = path;
+ rootdepth = ext4_extent_tree_depth(inode_ref);
- if (block > ext_block)
- return ext_pblk + (block - ext_block);
- else
- return ext_pblk - (ext_block - block);
+ /* Iterate the paths from the leaf to the root */
+ while (depth <= rootdepth) {
+ struct ext4_extent_header *header;
+
+ if (p->depth) {
+ ptr = p->index -
+ EXT4_EXTENT_FIRST_INDEX(p->header);
+ } else {
+ ptr = p->extent -
+ EXT4_EXTENT_FIRST(p->header);
}
- /* it looks like index is empty;
- * try to find starting block from index itself */
- if (path[depth].block.lb_id)
- return path[depth].block.lb_id;
- }
+ header = p->header;
- /* OK. use inode's group */
- return ext4_fs_inode_to_goal_block(inode_ref);
-}
+ if (ptr < ext4_extent_header_get_nentries(header) - 1)
+ /* We found a path with non-rightmost pointer */
+ break;
-/*
- * Allocation for a meta data block
- */
-static ext4_fsblk_t ext4_ext_new_meta_block(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path,
- struct ext4_extent *ex, int *err,
- uint32_t flags)
-{
- ext4_fsblk_t goal, newblock;
+ /* Move to the parent path */
+ p++;
+ depth++;
+ }
- goal = ext4_ext_find_goal(inode_ref, path, to_le32(ex->first_block));
- newblock = ext4_new_meta_blocks(inode_ref, goal, flags, NULL, err);
- return newblock;
-}
+ /* If we can't find a path with a non-rightmost pointer,
+ * we are already on the last extent, just return in this
+ * case */
+ if (depth > rootdepth)
+ goto out;
-#if CONFIG_META_CSUM_ENABLE
-static uint32_t ext4_ext_block_csum(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_header *eh)
-{
- uint32_t checksum = 0;
- struct ext4_sblock *sb = &inode_ref->fs->sb;
+ /* Increment the pointer once we found a path with non-rightmost
+ * pointer */
+ if (p->depth)
+ p->index++;
+ else
+ p->extent++;
- if (ext4_sb_feature_ro_com(sb, EXT4_FRO_COM_METADATA_CSUM)) {
- uint32_t ino_index = to_le32(inode_ref->index);
- uint32_t ino_gen =
- to_le32(ext4_inode_get_generation(inode_ref->inode));
- /* First calculate crc32 checksum against fs uuid */
- checksum =
- ext4_crc32c(EXT4_CRC32_INIT, sb->uuid, sizeof(sb->uuid));
- /* Then calculate crc32 checksum against inode number
- * and inode generation */
- checksum = ext4_crc32c(checksum, &ino_index, sizeof(ino_index));
- checksum = ext4_crc32c(checksum, &ino_gen, sizeof(ino_gen));
- /* Finally calculate crc32 checksum against
- * the entire extent block up to the checksum field */
- checksum =
- ext4_crc32c(checksum, eh, EXT4_EXTENT_TAIL_OFFSET(eh));
+ if (depth) {
+ /* We need to reload the paths to leaf if the path iterator
+ * is not pointing to the leaf */
+ ret = ext4_extent_reload_paths(inode_ref, path, depth, false);
+ if (ret != EOK)
+ goto out;
}
- return checksum;
-}
-#else
-#define ext4_ext_block_csum(...) 0
-#endif
-static void
-ext4_extent_block_csum_set(struct ext4_inode_ref *inode_ref __unused,
- struct ext4_extent_header *eh)
-{
- struct ext4_extent_tail *tail;
+ /* Found the next extent */
+ nonext = false;
+out:
+ if (nonextp)
+ *nonextp = nonext;
- tail = find_ext4_extent_tail(eh);
- tail->et_checksum = to_le32(ext4_ext_block_csum(inode_ref, eh));
+ return ret;
}
-static int ext4_ext_dirty(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path)
+/**@brief Seek to the previous extent
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree
+ * @param noprevp Output value - whether the current extent is the
+ * left-most extent already
+ * @return 0 on success, EIO on currupted block, or return values of
+ * ext4_trans_block_get(). */
+int
+ext4_extent_decrement(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ bool *noprevp)
{
- if (path->block.lb_id)
- ext4_trans_set_block_dirty(path->block.buf);
- else
- inode_ref->dirty = true;
+ int ret = EOK;
+ uint16_t ptr;
+ bool noprev = true;
+ uint16_t depth = 0;
+ struct ext4_extent_path *p;
+ uint16_t rootdepth;
- return EOK;
-}
+ p = path;
+ rootdepth = ext4_extent_tree_depth(inode_ref);
-static void ext4_ext_drop_refs(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, bool keep_other)
-{
- int32_t depth, i;
+ /* Iterate the paths from the leaf to the root */
+ while (depth <= rootdepth) {
+ if (p->depth) {
+ ptr = p->index -
+ EXT4_EXTENT_FIRST_INDEX(p->header);
+ } else {
+ ptr = p->extent -
+ EXT4_EXTENT_FIRST(p->header);
+ }
- if (!path)
- return;
- if (keep_other)
- depth = 0;
- else
- depth = path->depth;
+ if (ptr)
+ /* We found a path with non-leftmost pointer */
+ break;
- for (i = 0; i <= depth; i++, path++) {
- if (path->block.lb_id) {
- if (ext4_bcache_test_flag(path->block.buf, BC_DIRTY))
- ext4_extent_block_csum_set(inode_ref,
- path->header);
+ /* Move to the parent path */
+ p++;
+ depth++;
+ }
- ext4_block_set(inode_ref->fs->bdev, &path->block);
- }
+ /* If we can't find a path with a non-leftmost pointer,
+ * we are already on the first extent, just return in this
+ * case */
+ if (depth > rootdepth)
+ goto out;
+
+ /* Decrement the pointer once we found a path with non-leftmost
+ * pointer */
+ if (p->depth)
+ p->index--;
+ else
+ p->extent--;
+
+ if (depth) {
+ /* We need to reload the paths to leaf if the path iterator
+ * is not pointing to the leaf */
+ ret = ext4_extent_reload_paths(inode_ref, path, depth, true);
+ if (ret != EOK)
+ goto out;
}
+
+ /* Found the previous extent */
+ noprev = false;
+out:
+ if (noprevp)
+ *noprevp = noprev;
+ return ret;
}
-/*
- * Check that whether the basic information inside the extent header
- * is correct or not.
- */
-static int ext4_ext_check(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_header *eh, uint16_t depth,
- ext4_fsblk_t pblk __unused)
+
+/**@brief Update the index of nodes starting from leaf
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree
+ * @param force set this to true if insertion, deletion or modification
+ * of starting logical block of the first index in a node is made at non-leaf
+ * level */
+static void ext4_extent_update_index(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ bool force)
{
- struct ext4_extent_tail *tail;
- struct ext4_sblock *sb = &inode_ref->fs->sb;
- const char *error_msg;
+ uint16_t rootdepth;
+ struct ext4_extent_path *p;
- USED(pblk);
+ rootdepth = ext4_extent_tree_depth(inode_ref);
- if (to_le16(eh->magic) != EXT4_EXTENT_MAGIC) {
- error_msg = "invalid magic";
- goto corrupted;
- }
- if (to_le16(eh->depth) != depth) {
- error_msg = "unexpected eh_depth";
- goto corrupted;
- }
- if (eh->max_entries_count == 0) {
- error_msg = "invalid eh_max";
- goto corrupted;
- }
- if (to_le16(eh->entries_count) > to_le16(eh->max_entries_count)) {
- error_msg = "invalid eh_entries";
- goto corrupted;
- }
+ /* Iterate the paths from the parent of the leaf to the root */
+ for (p = path + 1; p <= path + rootdepth; p++) {
+ struct ext4_extent_path *chldp;
+ struct ext4_extent_header *child_header;
+ ptrdiff_t chldptr;
- tail = find_ext4_extent_tail(eh);
- if (ext4_sb_feature_ro_com(sb, EXT4_FRO_COM_METADATA_CSUM)) {
- if (tail->et_checksum !=
- to_le32(ext4_ext_block_csum(inode_ref, eh))) {
- ext4_dbg(DEBUG_EXTENT,
- DBG_WARN "Extent block checksum failed."
- "Blocknr: %" PRIu64 "\n",
- pblk);
- }
- }
+ /* This points to the child path of the current path */
+ chldp = p - 1;
+ child_header = chldp->header;
- return EOK;
+ if (!chldp->depth)
+ chldptr = chldp->extent -
+ EXT4_EXTENT_FIRST(child_header);
+ else
+ chldptr = chldp->index -
+ EXT4_EXTENT_FIRST_INDEX(child_header);
-corrupted:
- USED(error_msg);
- ext4_dbg(DEBUG_EXTENT, "Bad extents B+ tree block: %s. "
- "Blocknr: %" PRId64 "\n",
- error_msg, pblk);
- return EIO;
-}
+ /* If the modification on the child node is not made on the
+ * first slot of the node, we are done */
+ if (chldptr)
+ break;
-static int read_extent_tree_block(struct ext4_inode_ref *inode_ref,
- ext4_fsblk_t pblk, int32_t depth,
- struct ext4_block *bh,
- uint32_t flags __unused)
-{
- int err;
+ if (p->depth > 1) {
+ struct ext4_extent_index *idx = p->index;
+ struct ext4_extent_index *chldidx =
+ chldp->index;
+ ext4_lblk_t iblock, chldiblock;
- USED(flags);
- err = ext4_trans_block_get(inode_ref->fs->bdev, bh, pblk);
- if (err != EOK)
- goto errout;
+ iblock = ext4_extent_index_get_iblock(idx);
+ chldiblock = ext4_extent_index_get_iblock(chldidx);
- err = ext4_ext_check(inode_ref, ext_block_hdr(bh), depth, pblk);
- if (err != EOK)
- goto errout;
+ if (iblock != chldiblock) {
+ /* If the starting logical block of the first
+ * index of the child node is modified, we
+ * update the starting logical block of index
+ * pointing to the child node */
+ ext4_extent_index_set_iblock(idx, chldiblock);
+ ext4_extent_path_dirty(inode_ref, path,
+ p->depth);
+ } else if (!force)
+ /* We do not need to continue the iteration */
+ break;
+ } else {
+ struct ext4_extent_index *idx = p->index;
+ struct ext4_extent *chldext = chldp->extent;
+ ext4_lblk_t iblock, chldiblock;
- return EOK;
-errout:
- if (bh->lb_id)
- ext4_block_set(inode_ref->fs->bdev, bh);
+ iblock = ext4_extent_index_get_iblock(idx);
+ chldiblock = ext4_extent_get_iblock(chldext);
- return err;
+ if (iblock != chldiblock) {
+ /* If the starting logical block of the first
+ * extent of the child node is modified, we
+ * update the starting logical block of index
+ * pointing to the child node */
+ ext4_extent_index_set_iblock(idx, chldiblock);
+ ext4_extent_path_dirty(inode_ref, path,
+ p->depth);
+ } else if (!force)
+ /* We do not need to continue the iteration */
+ break;
+ }
+ };
}
-/*
- * ext4_ext_binsearch_idx:
- * binary search for the closest index of the given block
- * the header must be checked before calling this
- */
-static void ext4_ext_binsearch_idx(struct ext4_extent_path *path,
- ext4_lblk_t block)
+/**@brief Make the tree grow up by one level
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree
+ * @param new_fblock The newly allocated block for tree growth
+ * @return Error code */
+static int ext4_extent_grow_tree(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ ext4_fsblk_t newfblock)
{
- struct ext4_extent_header *eh = path->header;
- struct ext4_extent_index *r, *l, *m;
+ int rc;
+ uint16_t ptr;
+ struct ext4_block block;
+ ext4_lblk_t chldiblock;
+ uint16_t rootdepth;
+ struct ext4_block rootblock;
+ struct ext4_extent_header *rooteh;
+ struct ext4_extent_path *nrootp;
+ struct ext4_extent_path *rootp;
+ uint32_t blocksz;
+ uint16_t maxnentries;
- l = EXT_FIRST_INDEX(eh) + 1;
- r = EXT_LAST_INDEX(eh);
- while (l <= r) {
- m = l + (r - l) / 2;
- if (block < to_le32(m->first_block))
- r = m - 1;
- else
- l = m + 1;
+ rootdepth = ext4_extent_tree_depth(inode_ref);
+ rootp = path + rootdepth;
+ nrootp = rootp + 1;
+ rootblock = rootp->block;
+ rooteh = rootp->header;
+ blocksz = ext4_sb_get_block_size(&inode_ref->fs->sb);
+
+ /* Store the extent/index offset so that we can recover the
+ * pointer to it later */
+ if (rootdepth) {
+ ptr = rootp->index -
+ EXT4_EXTENT_FIRST_INDEX(rootp->header);
+ } else {
+ ptr = rootp->extent -
+ EXT4_EXTENT_FIRST(rootp->header);
}
+ /* Prepare a buffer for newly allocated block */
+ rc = ext4_trans_block_get_noread(inode_ref->fs->bdev, &block, newfblock);
+ if (rc != EOK)
+ return rc;
- path->index = l - 1;
-}
+ /* Initialize newly allocated block */
+ memset(block.data, 0, blocksz);
-/*
- * ext4_ext_binsearch:
- * binary search for closest extent of the given block
- * the header must be checked before calling this
- */
-static void ext4_ext_binsearch(struct ext4_extent_path *path, ext4_lblk_t block)
-{
- struct ext4_extent_header *eh = path->header;
- struct ext4_extent *r, *l, *m;
+ /* Move data from root to the new block */
+ memcpy(block.data, inode_ref->inode->blocks,
+ EXT4_INODE_BLOCKS * sizeof(uint32_t));
- if (eh->entries_count == 0) {
- /*
- * this leaf is empty:
- * we get such a leaf in split/add case
- */
- return;
+ /* Update old root path */
+ rootp->block = block;
+ rootp->header = (struct ext4_extent_header *)block.data;
+ if (rootp->depth) {
+ rootp->index =
+ EXT4_EXTENT_FIRST_INDEX(rootp->header) +
+ ptr;
+
+ maxnentries =
+ (blocksz - sizeof(struct ext4_extent_header)) /
+ sizeof(struct ext4_extent_index);
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ maxnentries = 5;
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ rootp->extent = NULL;
+ chldiblock =
+ ext4_extent_index_get_iblock(EXT4_EXTENT_FIRST_INDEX(rootp->header));
+ } else {
+ rootp->extent =
+ EXT4_EXTENT_FIRST(rootp->header) +
+ ptr;
+ maxnentries =
+ (blocksz - sizeof(struct ext4_extent_header)) /
+ sizeof(struct ext4_extent);
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ maxnentries = 5;
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ rootp->index = NULL;
+ chldiblock =
+ ext4_extent_get_iblock(EXT4_EXTENT_FIRST(rootp->header));
}
- l = EXT_FIRST_EXTENT(eh) + 1;
- r = EXT_LAST_EXTENT(eh);
+ /* Re-initialize new root metadata */
+ nrootp->depth = rootdepth + 1;
+ nrootp->block = rootblock;
+ nrootp->header = rooteh;
+ nrootp->extent = NULL;
+ nrootp->index = EXT4_EXTENT_FIRST_INDEX(nrootp->header);
- while (l <= r) {
- m = l + (r - l) / 2;
- if (block < to_le32(m->first_block))
- r = m - 1;
- else
- l = m + 1;
- }
+ ext4_extent_header_set_depth(nrootp->header, nrootp->depth);
- path->extent = l - 1;
+ /* Create new entry in root */
+ ext4_extent_header_set_nentries(nrootp->header, 1);
+ ext4_extent_index_set_iblock(nrootp->index, chldiblock);
+ ext4_extent_index_set_fblock(nrootp->index, newfblock);
+
+ /* Since new_root belongs to on-disk inode,
+ * we don't do checksum here */
+ inode_ref->dirty = true;
+
+ /* Set upper limit for entries count of old root */
+ ext4_extent_header_set_max_nentries(rootp->header, maxnentries);
+
+ ext4_extent_path_dirty(inode_ref, path, rootp->depth);
+
+ return EOK;
}
-static int ext4_find_extent(struct ext4_inode_ref *inode_ref, ext4_lblk_t block,
- struct ext4_extent_path **orig_path, uint32_t flags)
+/**@brief Do splitting on the tree if the leaf is full
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree for possible splitting
+ * @param nslots number of entries that will be inserted to the
+ * leaf in future.
+ * @return Error code */
+static int ext4_extent_split(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ uint16_t nslots)
{
- struct ext4_extent_header *eh;
- struct ext4_block bh = EXT4_BLOCK_ZERO();
- ext4_fsblk_t buf_block;
- struct ext4_extent_path *path = *orig_path;
- int32_t depth, ppos = 0;
- int32_t i;
int ret;
+ uint16_t i;
+ ext4_fsblk_t goal;
+ uint16_t rootdepth;
+ struct ext4_extent_path *p;
+ uint32_t blocksz;
+ /* Number of new blocks to be allocated */
+ uint16_t nnewfblocks = 0;
+ /* Number of node to be split */
+ uint16_t nsplits = 0;
+ /* Array of new blocks allocated */
+ ext4_fsblk_t *newfblocks;
+ /* The index of the right block inserted last time */
+ ext4_lblk_t lastiblock = 0;
+ /* Whether we updated child path to point to the right block
+ * at the previous round during splitting */
+ bool prevrblock = false;
- eh = ext_inode_hdr(inode_ref->inode);
- depth = ext_depth(inode_ref->inode);
+ blocksz = ext4_sb_get_block_size(&inode_ref->fs->sb);
+ rootdepth = ext4_extent_tree_depth(inode_ref);
+ goal = ext4_extent_tree_alloc_goal(inode_ref);
- if (path) {
- ext4_ext_drop_refs(inode_ref, path, 0);
- if (depth > path[0].maxdepth) {
- ext4_free(path);
- *orig_path = path = NULL;
+ /* First calculate how many levels will be touched */
+ for (p = path; p <= path + rootdepth; p++) {
+ uint16_t entries =
+ ext4_extent_header_get_nentries(p->header);
+ uint16_t limit =
+ ext4_extent_header_get_max_nentries(p->header);
+
+ ext4_assert(entries <= limit);
+ if (!p->depth) {
+ if (entries + nslots <= limit)
+ break;
+ } else {
+ if (entries < limit)
+ break;
}
+ /* We have to split a node when the tree is full */
+ nnewfblocks++;
+ nsplits++;
}
- if (!path) {
- int32_t path_depth = depth + 1;
- /* account possible depth increase */
- path = ext4_calloc(1, sizeof(struct ext4_extent_path) *
- (path_depth + 1));
- if (!path)
- return ENOMEM;
- path[0].maxdepth = path_depth;
- }
- path[0].header = eh;
- path[0].block = bh;
- i = depth;
- /* walk through the tree */
- while (i) {
- ext4_ext_binsearch_idx(path + ppos, block);
- path[ppos].p_block = ext4_idx_pblock(path[ppos].index);
- path[ppos].depth = i;
- path[ppos].extent = NULL;
- buf_block = path[ppos].p_block;
+ if (!nnewfblocks)
+ return EOK;
- i--;
- ppos++;
- if (!path[ppos].block.lb_id ||
- path[ppos].block.lb_id != buf_block) {
- ret = read_extent_tree_block(inode_ref, buf_block, i,
- &bh, flags);
- if (ret != EOK) {
- goto err;
- }
- if (ppos > depth) {
- ext4_block_set(inode_ref->fs->bdev, &bh);
- ret = EIO;
- goto err;
- }
+ /* Allocate the array for storing newly allocated blocks */
+ newfblocks = ext4_malloc(sizeof(ext4_fsblk_t) * nnewfblocks);
+ if (!newfblocks)
+ return ENOMEM;
- eh = ext_block_hdr(&bh);
- path[ppos].block = bh;
- path[ppos].header = eh;
- }
+ for (i = 0; i < nnewfblocks; i++) {
+ ret = ext4_balloc_alloc_block(inode_ref, goal, newfblocks + i);
+ if (ret != EOK)
+ return ret;
}
- path[ppos].depth = i;
- path[ppos].extent = NULL;
- path[ppos].index = NULL;
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "nnewfblocks: %" PRIu16 " rootdepth: %" PRIu16 "\n",
+ nnewfblocks, rootdepth);
- /* find extent */
- ext4_ext_binsearch(path + ppos, block);
- /* if not an empty leaf */
- if (path[ppos].extent)
- path[ppos].p_block = ext4_ext_pblock(path[ppos].extent);
+ /* If number of blocks to be allocated is greater than
+ * the depth of root we have to grow the tree */
+ if (nnewfblocks == rootdepth + 1) {
+ ext4_dbg(DEBUG_EXTENT, "Growing: \n");
+ nsplits--;
- *orig_path = path;
+ ret = ext4_extent_grow_tree(inode_ref,
+ path, newfblocks[rootdepth]);
+ if (ret != EOK)
+ goto finish;
- ret = EOK;
- return ret;
+ ext4_extent_print_path(inode_ref, path);
-err:
- ext4_ext_drop_refs(inode_ref, path, 0);
- ext4_free(path);
- if (orig_path)
- *orig_path = NULL;
- return ret;
-}
+ /* If we are moving the in-inode leaf to on-block leaf.
+ * we do not need further actions. */
+ if (!rootdepth)
+ goto finish;
-static void ext4_ext_init_header(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_header *eh, int32_t depth)
-{
- eh->entries_count = 0;
- eh->max_entries_count = to_le16(ext4_ext_max_entries(inode_ref, depth));
- eh->magic = to_le16(EXT4_EXTENT_MAGIC);
- eh->depth = depth;
-}
+ ++rootdepth; USED(rootdepth);
+ }
-static int ext4_ext_insert_index(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, int at,
- ext4_lblk_t insert_index,
- ext4_fsblk_t insert_block, bool set_to_ix)
-{
- struct ext4_extent_index *ix;
- struct ext4_extent_path *curp = path + at;
- int len, err;
- struct ext4_extent_header *eh;
+ /* Start splitting */
+ p = path;
+ ext4_dbg(DEBUG_EXTENT, DBG_INFO "Start splitting: \n");
+ for (i = 0; i < nsplits; i++, p++) {
+ struct ext4_extent_header *header;
+ uint16_t entries =
+ ext4_extent_header_get_nentries(p->header);
+ uint16_t limit =
+ ext4_extent_header_get_max_nentries(p->header);
+ /* The entry we start shifting to the right block */
+ uint16_t split_ptr = entries / 2;
+ /* The number of entry the right block will have */
+ uint16_t right_entries = entries - split_ptr;
+ /* The current entry */
+ uint16_t curr_ptr;
+ ext4_lblk_t riblock;
+ struct ext4_block block;
- if (curp->index && insert_index == to_le32(curp->index->first_block))
- return EIO;
+ ret = ext4_trans_block_get_noread(inode_ref->fs->bdev,
+ &block, newfblocks[i]);
+ if (ret != EOK)
+ goto finish;
- if (to_le16(curp->header->entries_count) ==
- to_le16(curp->header->max_entries_count))
- return EIO;
+ /* Initialize newly allocated block and remember it */
+ memset(block.data, 0, blocksz);
- eh = curp->header;
- if (curp->index == NULL) {
- ix = EXT_FIRST_INDEX(eh);
- curp->index = ix;
- } else if (insert_index > to_le32(curp->index->first_block)) {
- /* insert after */
- ix = curp->index + 1;
- } else {
- /* insert before */
- ix = curp->index;
- }
+ header = (void *)block.data;
- if (ix > EXT_MAX_INDEX(eh))
- return EIO;
+ /* Initialize on-disk structure (header) */
+ ext4_extent_header_set_nentries(header,
+ right_entries);
+ ext4_extent_header_set_max_nentries(header, limit);
+ ext4_extent_header_set_magic(header, EXT4_EXTENT_MAGIC);
+ ext4_extent_header_set_depth(header, p->depth);
+ ext4_extent_header_set_generation(header, 0);
- len = EXT_LAST_INDEX(eh) - ix + 1;
- ext4_assert(len >= 0);
- if (len > 0)
- memmove(ix + 1, ix, len * sizeof(struct ext4_extent_index));
+ /* Move some entries from old block to new block */
+ if (p->depth) {
+ struct ext4_extent_index *left_index =
+ EXT4_EXTENT_FIRST_INDEX(p->header);
+ struct ext4_extent_index *split_index =
+ left_index + split_ptr;
- ix->first_block = to_le32(insert_index);
- ext4_idx_store_pblock(ix, insert_block);
- eh->entries_count = to_le16(to_le16(eh->entries_count) + 1);
+ riblock = ext4_extent_index_get_iblock(split_index);
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "depth: %" PRIu32 ", riblock: %" PRIu32 "\n",
+ p->depth, riblock);
- if (ix > EXT_LAST_INDEX(eh)) {
- err = EIO;
- goto out;
- }
+ curr_ptr = p->index - left_index;
- err = ext4_ext_dirty(inode_ref, curp);
+ memcpy(EXT4_EXTENT_FIRST_INDEX(header),
+ split_index,
+ right_entries * EXT4_EXTENT_INDEX_SIZE);
+ memset(split_index, 0,
+ right_entries * EXT4_EXTENT_INDEX_SIZE);
+ } else {
+ struct ext4_extent *left_extent =
+ EXT4_EXTENT_FIRST(p->header);
+ struct ext4_extent *split_extent =
+ left_extent + split_ptr;
-out:
- if (err == EOK && set_to_ix) {
- curp->index = ix;
- curp->p_block = ext4_idx_pblock(ix);
- }
- return err;
-}
+ riblock = ext4_extent_get_iblock(split_extent);
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "depth: %" PRIu32 ", riblock: %" PRIu32 "\n",
+ p->depth, riblock);
-static int ext4_ext_split_node(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, int at,
- struct ext4_extent *newext,
- struct ext4_extent_path *npath,
- bool *ins_right_leaf)
-{
- int i, npath_at, ret;
- ext4_lblk_t insert_index;
- ext4_fsblk_t newblock;
- int depth = ext_depth(inode_ref->inode);
- npath_at = depth - at;
+ curr_ptr = p->extent - left_extent;
- ext4_assert(at > 0);
+ memcpy(EXT4_EXTENT_FIRST(header),
+ split_extent,
+ right_entries * EXT4_EXTENT_SIZE);
+ memset(split_extent, 0,
+ right_entries * EXT4_EXTENT_SIZE);
+ }
- if (path[depth].extent != EXT_MAX_EXTENT(path[depth].header))
- insert_index = path[depth].extent[1].first_block;
- else
- insert_index = newext->first_block;
+ /* Set entries count in left node */
+ ext4_extent_header_set_nentries(p->header,
+ entries - right_entries);
- for (i = depth; i >= at; i--, npath_at--) {
- struct ext4_block bh = EXT4_BLOCK_ZERO();
+ /* Decide whether we need to update the path to
+ * point to right block or not */
+ if (curr_ptr >= split_ptr) {
+ /* Update the checksum for the left block */
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
- /* FIXME: currently we split at the point after the current
- * extent. */
- newblock =
- ext4_ext_new_meta_block(inode_ref, path, newext, &ret, 0);
- if (ret != EOK)
- goto cleanup;
+ /* Put back the left block */
+ ret = ext4_block_set(inode_ref->fs->bdev,
+ &p->block);
+ if (ret != EOK)
+ goto finish;
- /* For write access.*/
- ret = ext4_trans_block_get_noread(inode_ref->fs->bdev, &bh,
- newblock);
- if (ret != EOK)
- goto cleanup;
+ /* Update pointers in extent path structure to
+ * point to right block */
+ p->block = block;
+ p->header = (void *)block.data;
- if (i == depth) {
- /* start copy from next extent */
- int m = EXT_MAX_EXTENT(path[i].header) - path[i].extent;
- struct ext4_extent_header *neh;
- struct ext4_extent *ex;
- neh = ext_block_hdr(&bh);
- ex = EXT_FIRST_EXTENT(neh);
- ext4_ext_init_header(inode_ref, neh, 0);
- if (m) {
- memmove(ex, path[i].extent + 1,
- sizeof(struct ext4_extent) * m);
- neh->entries_count =
- to_le16(to_le16(neh->entries_count) + m);
- path[i].header->entries_count = to_le16(
- to_le16(path[i].header->entries_count) - m);
- ret = ext4_ext_dirty(inode_ref, path + i);
- if (ret != EOK)
- goto cleanup;
-
- npath[npath_at].p_block = ext4_ext_pblock(ex);
- npath[npath_at].extent = ex;
+ if (p->depth) {
+ p->index =
+ EXT4_EXTENT_FIRST_INDEX(p->header) +
+ curr_ptr - split_ptr;
} else {
- npath[npath_at].p_block = 0;
- npath[npath_at].extent = NULL;
+ p->extent =
+ EXT4_EXTENT_FIRST(p->header) +
+ curr_ptr - split_ptr;
}
+ } else {
+ /* Update the checksum for the right block */
+ ext4_extent_block_csum_set(inode_ref, header);
+ ext4_trans_set_block_dirty(block.buf);
- npath[npath_at].depth = to_le16(neh->depth);
- npath[npath_at].maxdepth = 0;
- npath[npath_at].index = NULL;
- npath[npath_at].header = neh;
- npath[npath_at].block = bh;
+ /* Put back the right block */
+ ret = ext4_block_set(inode_ref->fs->bdev,
+ &block);
+ if (ret != EOK)
+ goto finish;
+ }
- ext4_trans_set_block_dirty(bh.buf);
- } else {
- int m = EXT_MAX_INDEX(path[i].header) - path[i].index;
- struct ext4_extent_header *neh;
- struct ext4_extent_index *ix;
- neh = ext_block_hdr(&bh);
- ix = EXT_FIRST_INDEX(neh);
- ext4_ext_init_header(inode_ref, neh, depth - i);
- ix->first_block = to_le32(insert_index);
- ext4_idx_store_pblock(ix,
- npath[npath_at + 1].block.lb_id);
- neh->entries_count = to_le16(1);
- if (m) {
- memmove(ix + 1, path[i].index + 1,
- sizeof(struct ext4_extent) * m);
- neh->entries_count =
- to_le16(to_le16(neh->entries_count) + m);
- path[i].header->entries_count = to_le16(
- to_le16(path[i].header->entries_count) - m);
- ret = ext4_ext_dirty(inode_ref, path + i);
- if (ret != EOK)
- goto cleanup;
- }
+ /* Append an index after the current index */
+ if (p->depth) {
+ struct ext4_extent_index *index = p->index + 1;
- npath[npath_at].p_block = ext4_idx_pblock(ix);
- npath[npath_at].depth = to_le16(neh->depth);
- npath[npath_at].maxdepth = 0;
- npath[npath_at].extent = NULL;
- npath[npath_at].index = ix;
- npath[npath_at].header = neh;
- npath[npath_at].block = bh;
+ /* If we updated the path to right block in the previous
+ * round, we update the pointer in the path to point to
+ * the right block */
+ if (prevrblock)
+ p->index++;
- ext4_trans_set_block_dirty(bh.buf);
+ if (index <= EXT4_EXTENT_LAST_INDEX(p->header)) {
+ uint16_t nindex =
+ EXT4_EXTENT_LAST_INDEX(p->header) -
+ index + 1;
+
+ memmove(index + 1,
+ index,
+ nindex * EXT4_EXTENT_INDEX_SIZE);
+ }
+ memset(index, 0, EXT4_EXTENT_INDEX_SIZE);
+ ext4_extent_index_set_iblock(index, lastiblock);
+ ext4_extent_index_set_fblock(index, newfblocks[i - 1]);
+
+ entries = ext4_extent_header_get_nentries(p->header);
+ ext4_extent_header_set_nentries(p->header,
+ entries + 1);
}
+
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
+
+ /* We may have updated the path to right block in this round */
+ prevrblock = curr_ptr >= split_ptr;
+
+ /* We also update the lastiblock variable to the index of the
+ * right block */
+ lastiblock = riblock;
}
- newblock = 0;
- /*
- * If newext->first_block can be included into the
- * right sub-tree.
- */
- if (to_le32(newext->first_block) < insert_index)
- *ins_right_leaf = false;
- else
- *ins_right_leaf = true;
+ /* Append an index after the current index */
+ if (p->depth) {
+ struct ext4_extent_index *index = p->index + 1;
+ uint16_t entries =
+ ext4_extent_header_get_nentries(p->header);
- ret = ext4_ext_insert_index(inode_ref, path, at - 1, insert_index,
- npath[0].block.lb_id, *ins_right_leaf);
+ /* If we updated the path to right block in the previous
+ * round, we update the pointer in the path to point to
+ * the right block */
+ if (prevrblock)
+ p->index++;
-cleanup:
- if (ret != EOK) {
- if (newblock)
- ext4_ext_free_blocks(inode_ref, newblock, 1, 0);
+ if (index <= EXT4_EXTENT_LAST_INDEX(p->header)) {
+ uint16_t nindex =
+ EXT4_EXTENT_LAST_INDEX(p->header) -
+ index + 1;
- npath_at = depth - at;
- while (npath_at >= 0) {
- if (npath[npath_at].block.lb_id) {
- newblock = npath[npath_at].block.lb_id;
- ext4_block_set(inode_ref->fs->bdev,
- &npath[npath_at].block);
- ext4_ext_free_blocks(inode_ref, newblock, 1, 0);
- memset(&npath[npath_at].block, 0,
- sizeof(struct ext4_block));
- }
- npath_at--;
+ memmove(index + 1,
+ index,
+ nindex * EXT4_EXTENT_INDEX_SIZE);
}
+ memset(index, 0, EXT4_EXTENT_INDEX_SIZE);
+ ext4_extent_index_set_iblock(index, lastiblock);
+ ext4_extent_index_set_fblock(index, newfblocks[i - 1]);
+ ext4_extent_header_set_nentries(p->header,
+ entries + 1);
+
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
}
+
+ ret = EOK;
+finish:
+ if (ret != EOK)
+ for (i = 0; i < nnewfblocks; i++)
+ ext4_balloc_free_block(inode_ref, newfblocks[i]);
+
+ ext4_free(newfblocks);
return ret;
}
-/*
- * ext4_ext_correct_indexes:
- * if leaf gets modified and modified extent is first in the leaf,
- * then we have to correct all indexes above.
- */
-static int ext4_ext_correct_indexes(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path)
+/**@brief Insert an extent into the extent tree
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree for possible splitting
+ * @param ext Extent to be inserted
+ * @return Error code */
+static int ext4_extent_insert(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ struct ext4_extent *ext)
{
- struct ext4_extent_header *eh;
- int32_t depth = ext_depth(inode_ref->inode);
- struct ext4_extent *ex;
- uint32_t border;
- int32_t k;
- int err;
+ int ret;
+ uint16_t entries;
+ struct ext4_extent_path *p;
- eh = path[depth].header;
- ex = path[depth].extent;
+ /* Split and grow the tree if necessary */
+ ret = ext4_extent_split(inode_ref, path, 1);
+ if (ret != EOK)
+ return ret;
- if (ex == NULL || eh == NULL)
- return EIO;
+ p = path;
+ entries = ext4_extent_header_get_nentries(p->header);
- if (depth == 0) {
- /* there is no tree at all */
- return EOK;
- }
+ ext4_dbg(DEBUG_EXTENT, DBG_INFO "After splitting: \n");
+ ext4_extent_print_path(inode_ref, path);
- if (ex != EXT_FIRST_EXTENT(eh)) {
- /* we correct tree if first leaf got modified only */
- return EOK;
+ if (!p->extent) {
+ p->extent = EXT4_EXTENT_FIRST(p->header);
+ } else {
+ ext4_lblk_t iblock;
+
+ iblock = ext4_extent_get_iblock(p->extent);
+ if (ext4_extent_get_iblock(ext) > iblock)
+ p->extent++;
}
- k = depth - 1;
- border = path[depth].extent->first_block;
- path[k].index->first_block = border;
- err = ext4_ext_dirty(inode_ref, path + k);
- if (err != EOK)
- return err;
+ if (p->extent <= EXT4_EXTENT_LAST(p->header)) {
+ uint16_t nextent =
+ EXT4_EXTENT_LAST(p->header) -
+ p->extent + 1;
- while (k--) {
- /* change all left-side indexes */
- if (path[k + 1].index != EXT_FIRST_INDEX(path[k + 1].header))
- break;
- path[k].index->first_block = border;
- err = ext4_ext_dirty(inode_ref, path + k);
- if (err != EOK)
- break;
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "%" PRIu16 " extents to be shifted at leaf\n",
+ nextent);
+
+ memmove(p->extent + 1,
+ p->extent,
+ nextent * EXT4_EXTENT_SIZE);
}
+ memcpy(p->extent, ext, EXT4_EXTENT_SIZE);
+ ext4_extent_header_set_nentries(p->header,
+ entries + 1);
- return err;
-}
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
-static inline bool ext4_ext_can_prepend(struct ext4_extent *ex1,
- struct ext4_extent *ex2)
-{
- if (ext4_ext_pblock(ex2) + ext4_ext_get_actual_len(ex2) !=
- ext4_ext_pblock(ex1))
- return 0;
+ ext4_dbg(DEBUG_EXTENT, DBG_INFO "Before updating indice: \n");
+ ext4_extent_print_path(inode_ref, path);
-#ifdef AGGRESSIVE_TEST
- if (ext4_ext_get_actual_len(ex1) + ext4_ext_get_actual_len(ex2) > 4)
- return 0;
-#else
- if (ext4_ext_is_unwritten(ex1)) {
- if (ext4_ext_get_actual_len(ex1) +
- ext4_ext_get_actual_len(ex2) >
- EXT_UNWRITTEN_MAX_LEN)
- return 0;
- } else if (ext4_ext_get_actual_len(ex1) + ext4_ext_get_actual_len(ex2) >
- EXT_INIT_MAX_LEN)
- return 0;
-#endif
+ /* Update the index of the first entry in parents node */
+ ext4_extent_update_index(inode_ref, path, false);
- if (to_le32(ex2->first_block) + ext4_ext_get_actual_len(ex2) !=
- to_le32(ex1->first_block))
- return 0;
+ ext4_dbg(DEBUG_EXTENT, DBG_INFO "At the end: \n");
+ ext4_extent_print_path(inode_ref, path);
- return 1;
+ return ret;
}
-static inline bool ext4_ext_can_append(struct ext4_extent *ex1,
- struct ext4_extent *ex2)
+/**@brief Delete an item from the node at @depth pointed
+ * @param inode_ref I-node the extent tree resides in
+ * @param path Path in the extent tree for possible splitting
+ * @param depth The level of the node to be operated on
+ * @return Error code */
+static void
+ext4_extent_delete_item(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ uint16_t depth)
{
- if (ext4_ext_pblock(ex1) + ext4_ext_get_actual_len(ex1) !=
- ext4_ext_pblock(ex2))
- return 0;
+ uint16_t nitems;
+ struct ext4_extent_header *hdr;
+ struct ext4_extent_path *p;
-#ifdef AGGRESSIVE_TEST
- if (ext4_ext_get_actual_len(ex1) + ext4_ext_get_actual_len(ex2) > 4)
- return 0;
-#else
- if (ext4_ext_is_unwritten(ex1)) {
- if (ext4_ext_get_actual_len(ex1) +
- ext4_ext_get_actual_len(ex2) >
- EXT_UNWRITTEN_MAX_LEN)
- return 0;
- } else if (ext4_ext_get_actual_len(ex1) + ext4_ext_get_actual_len(ex2) >
- EXT_INIT_MAX_LEN)
- return 0;
-#endif
+ p = path + depth;
- if (to_le32(ex1->first_block) + ext4_ext_get_actual_len(ex1) !=
- to_le32(ex2->first_block))
- return 0;
+ hdr = p->header;
+ ext4_assert(ext4_extent_header_get_nentries(hdr));
- return 1;
+ if (p->depth) {
+ struct ext4_extent_index *idx;
+
+ idx = p->index;
+ nitems = EXT4_EXTENT_LAST_INDEX(hdr) - (idx + 1) + 1;
+ if (nitems) {
+ memmove(idx, idx + 1,
+ nitems * EXT4_EXTENT_INDEX_SIZE);
+ memset(EXT4_EXTENT_LAST(hdr), 0,
+ EXT4_EXTENT_INDEX_SIZE);
+ } else {
+ memset(idx, 0, EXT4_EXTENT_INDEX_SIZE);
+ }
+ } else {
+ struct ext4_extent *ext;
+
+ ext = p->extent;
+ nitems = EXT4_EXTENT_LAST(hdr) - (ext + 1) + 1;
+ if (nitems) {
+ memmove(ext, ext + 1,
+ nitems * EXT4_EXTENT_SIZE);
+ memset(EXT4_EXTENT_LAST(hdr), 0,
+ EXT4_EXTENT_SIZE);
+ } else {
+ memset(ext, 0, EXT4_EXTENT_SIZE);
+ }
+ }
+
+ nitems = ext4_extent_header_get_nentries(hdr) - 1;
+ ext4_extent_header_set_nentries(hdr,
+ nitems);
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
}
-static int ext4_ext_insert_leaf(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, int at,
- struct ext4_extent *newext, int flags,
- bool *need_split)
+/**@brief Remove extents in a leaf starting
+ * from the current extent and having
+ * key less than or equal to @toiblock.
+ * @param inode_ref I-node the tree resides in
+ * @param path Path in the extent tree
+ * @param toiblock The logical block
+ * @param stopp Output value to tell whether the caller should
+ * stop deletion. Will be set to true if an extent having key greater
+ * than @toiblock is met.
+ * @return 0 if there is no error, or return values of blocks
+ * freeing routine. */
+static int
+ext4_extent_delete_leaf(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ ext4_lblk_t toiblock,
+ bool *stopp)
{
- struct ext4_extent_path *curp = path + at;
- struct ext4_extent *ex = curp->extent;
- int len, err, unwritten;
- struct ext4_extent_header *eh;
+ int ret = EOK;
+ uint16_t nitems;
+ struct ext4_extent *ext;
+ struct ext4_extent_header *hdr;
+ struct ext4_extent_path *p;
- *need_split = false;
+ p = path;
+ *stopp = false;
- if (curp->extent &&
- to_le32(newext->first_block) == to_le32(curp->extent->first_block))
- return EIO;
+ while (1) {
+ bool unwritten;
+ uint16_t ptr;
+ uint16_t len;
+ uint16_t flen;
+ ext4_lblk_t endiblock;
+ ext4_lblk_t startiblock;
+ ext4_fsblk_t blocknr;
- if (!(flags & EXT4_EXT_NO_COMBINE)) {
- if (curp->extent && ext4_ext_can_append(curp->extent, newext)) {
- unwritten = ext4_ext_is_unwritten(curp->extent);
- curp->extent->block_count =
- to_le16(ext4_ext_get_actual_len(curp->extent) +
- ext4_ext_get_actual_len(newext));
- if (unwritten)
- ext4_ext_mark_unwritten(curp->extent);
+ hdr = p->header;
+ nitems = ext4_extent_header_get_nentries(hdr);
+ ptr = p->extent - EXT4_EXTENT_FIRST(hdr);
- err = ext4_ext_dirty(inode_ref, curp);
- goto out;
- }
+ ext4_assert(nitems > 0);
- if (curp->extent &&
- ext4_ext_can_prepend(curp->extent, newext)) {
- unwritten = ext4_ext_is_unwritten(curp->extent);
- curp->extent->first_block = newext->first_block;
- curp->extent->block_count =
- to_le16(ext4_ext_get_actual_len(curp->extent) +
- ext4_ext_get_actual_len(newext));
- if (unwritten)
- ext4_ext_mark_unwritten(curp->extent);
+ ext = p->extent;
+ blocknr = ext4_extent_get_fblock(ext);
+ startiblock = ext4_extent_get_iblock(ext);
+ endiblock = startiblock + ext4_extent_get_nblocks(ext) - 1;
+ len = endiblock - startiblock + 1;
+ unwritten = EXT4_EXT_IS_UNWRITTEN(ext);
- err = ext4_ext_dirty(inode_ref, curp);
- goto out;
+ /* We have to stop if the extent's key
+ * is greater than @toiblock. */
+ if (toiblock < startiblock) {
+ *stopp = true;
+ break;
}
- }
- if (to_le16(curp->header->entries_count) ==
- to_le16(curp->header->max_entries_count)) {
- err = EIO;
- *need_split = true;
- goto out;
- } else {
- eh = curp->header;
- if (curp->extent == NULL) {
- ex = EXT_FIRST_EXTENT(eh);
- curp->extent = ex;
- } else if (to_le32(newext->first_block) >
- to_le32(curp->extent->first_block)) {
- /* insert after */
- ex = curp->extent + 1;
- } else {
- /* insert before */
- ex = curp->extent;
+ if (toiblock < endiblock) {
+ /* In case @toiblock is smaller than the last
+ * logical block of the extent, we do not
+ * need to delete the extent. We modify it only. */
+
+ /* Unmap the underlying blocks. */
+ flen = toiblock - startiblock + 1;
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Freeing: %" PRIu64 ":%" PRIu16 "\n",
+ blocknr, flen);
+ ext4_balloc_free_blocks(inode_ref, blocknr, flen);
+
+ /* Adjust the starting block and length of the
+ * current extent. */
+ blocknr += flen;
+ startiblock = toiblock + 1;
+ len = endiblock - startiblock + 1;
+ ext4_extent_set_iblock(ext, startiblock);
+ ext4_extent_set_nblocks(ext, len, unwritten);
+ ext4_extent_set_fblock(ext, blocknr);
+
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
+
+ *stopp = 1;
+ break;
}
- }
- len = EXT_LAST_EXTENT(eh) - ex + 1;
- ext4_assert(len >= 0);
- if (len > 0)
- memmove(ex + 1, ex, len * sizeof(struct ext4_extent));
+ /* Delete the extent pointed to by the path. */
+ ext4_extent_delete_item(inode_ref, path, 0);
+ nitems--;
- if (ex > EXT_MAX_EXTENT(eh)) {
- err = EIO;
- goto out;
+ /* Unmap the underlying blocks. */
+ flen = len;
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Freeing: %" PRIu64 ":%" PRIu16 "\n",
+ blocknr, flen);
+ ext4_balloc_free_blocks(inode_ref, blocknr, flen);
+
+ /* There are no more items we could delete. */
+ if (ptr >= nitems)
+ break;
}
+ return ret;
+}
- ex->first_block = newext->first_block;
- ex->block_count = newext->block_count;
- ext4_ext_store_pblock(ex, ext4_ext_pblock(newext));
- eh->entries_count = to_le16(to_le16(eh->entries_count) + 1);
+/**@brief Remove the current index at specified level.
+ * @param cur Cursor to an extent tree
+ * @param depth The level where deletion takes place at
+ * @return 0 if there is no error, or return values of blocks
+ * freeing routine. */
+static int
+ext4_extent_delete_node(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ uint16_t depth)
+{
+ int ret = EOK;
+ ext4_fsblk_t fblock;
+ struct ext4_extent_index *idx;
+ struct ext4_extent_header *hdr;
+ struct ext4_extent_path *p;
- if (ex > EXT_LAST_EXTENT(eh)) {
- err = EIO;
- goto out;
- }
+ /* If we leave nothing in the node after deletion of
+ * an item, we free the block and delete the index
+ * of the node. Get the respective key of the node
+ * in the parent level */
+ p = path + depth;
+ hdr = p->header;
+ ext4_assert(ext4_extent_header_get_nentries(hdr) > 0);
+ idx = p->index;
+ fblock = ext4_extent_index_get_fblock(idx);
- err = ext4_ext_correct_indexes(inode_ref, path);
- if (err != EOK)
- goto out;
- err = ext4_ext_dirty(inode_ref, curp);
+ /* Delete the index pointed to by the path. */
+ ext4_extent_delete_item(inode_ref, path, depth);
-out:
- if (err == EOK) {
- curp->extent = ex;
- curp->p_block = ext4_ext_pblock(ex);
- }
+ /* Free the block of it. */
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Freeing: %" PRIu64 ":%" PRIu16 "\n",
+ fblock, 1);
+ ext4_balloc_free_blocks(inode_ref, fblock, 1);
- return err;
+ return ret;
}
-/*
- * ext4_ext_grow_indepth:
- * implements tree growing procedure:
- * - allocates new block
- * - moves top-level data (index block or leaf) into the new block
- * - initializes new top-level, creating index that points to the
- * just created block
+/**@brief Delete the mapping in extent tree starting from \p fromiblock to
+ * \p toiblock inclusively.
+ * @param cur Cursor to an extent tree
+ * @return 0 on success, ENOENT if there is no item to be deleted,
+ * return values of ext4_ext_increment(), ext4_ext_insert(),
+ * ext4_ext_delete_leaf(), ext4_ext_delete_node() ext4_ext_reload_paths(),
+ * ext4_ext_tree_shrink(). Cursor MUST be discarded after deletion.
*/
-static int ext4_ext_grow_indepth(struct ext4_inode_ref *inode_ref,
- uint32_t flags)
+int ext4_extent_remove_space(struct ext4_inode_ref *inode_ref,
+ ext4_lblk_t fromiblock,
+ ext4_lblk_t toiblock)
{
- struct ext4_extent_header *neh;
- struct ext4_block bh = EXT4_BLOCK_ZERO();
- ext4_fsblk_t newblock, goal;
- int err = EOK;
+ int ret;
+ uint16_t nitems;
+ int rootdepth;
+ struct ext4_extent_header *hdr;
+ struct ext4_extent *ext;
+ ext4_lblk_t endiblock;
+ ext4_lblk_t startiblock;
+ struct ext4_extent_path *path, *p;
- /* Try to prepend new index to old one */
- if (ext_depth(inode_ref->inode))
- goal = ext4_idx_pblock(
- EXT_FIRST_INDEX(ext_inode_hdr(inode_ref->inode)));
- else
- goal = ext4_fs_inode_to_goal_block(inode_ref);
+ rootdepth = ext4_extent_tree_depth(inode_ref);
- newblock = ext4_new_meta_blocks(inode_ref, goal, flags, NULL, &err);
- if (newblock == 0)
- return err;
+ ret = ext4_extent_find_extent(inode_ref, fromiblock, &path);
+ if (ret != EOK)
+ return ret;
- /* # */
- err = ext4_trans_block_get_noread(inode_ref->fs->bdev, &bh, newblock);
- if (err != EOK) {
- ext4_ext_free_blocks(inode_ref, newblock, 1, 0);
- return err;
- }
+ p = path;
+ hdr = p->header; USED(hdr);
- /* move top-level index/leaf into new block */
- memmove(bh.data, inode_ref->inode->blocks,
- sizeof(inode_ref->inode->blocks));
+ /* We return EOK even if the whole extent tree is empty. */
+ if (!ext4_extent_header_get_nentries(path->header))
+ goto out;
- /* set size of new block */
- neh = ext_block_hdr(&bh);
- /* old root could have indexes or leaves
- * so calculate e_max right way */
- if (ext_depth(inode_ref->inode))
- neh->max_entries_count =
- to_le16(ext4_ext_space_block_idx(inode_ref));
- else
- neh->max_entries_count =
- to_le16(ext4_ext_space_block(inode_ref));
+ /* Calculate the last logical block of the current extent. */
+ ext4_dbg(DEBUG_EXTENT, DBG_INFO "At start of remove_space: \n");
+ ext4_extent_print_path(inode_ref, path);
- neh->magic = to_le16(EXT4_EXTENT_MAGIC);
- ext4_extent_block_csum_set(inode_ref, neh);
+ ext = p->extent;
+ startiblock = ext4_extent_get_iblock(ext);
+ endiblock = startiblock + ext4_extent_get_nblocks(ext) - 1;
- /* Update top-level index: num,max,pointer */
- neh = ext_inode_hdr(inode_ref->inode);
- neh->entries_count = to_le16(1);
- ext4_idx_store_pblock(EXT_FIRST_INDEX(neh), newblock);
- if (neh->depth == 0) {
- /* Root extent block becomes index block */
- neh->max_entries_count =
- to_le16(ext4_ext_space_root_idx(inode_ref));
- EXT_FIRST_INDEX(neh)
- ->first_block = EXT_FIRST_EXTENT(neh)->first_block;
- }
- neh->depth = to_le16(to_le16(neh->depth) + 1);
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Extent: %" PRIu32 ":%" PRIu16 "\n",
+ startiblock, endiblock);
- ext4_trans_set_block_dirty(bh.buf);
- inode_ref->dirty = true;
- ext4_block_set(inode_ref->fs->bdev, &bh);
+ if (fromiblock > endiblock) {
+ bool nonext;
- return err;
-}
+ /* The last logical block of the current extent is smaller
+ * than the first logical block we are going to remove,
+ * thus we increment the extent pointer of the cursor. */
-static inline void ext4_ext_replace_path(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path,
- struct ext4_extent_path *newpath,
- int at)
-{
- ext4_ext_drop_refs(inode_ref, path + at, 1);
- path[at] = *newpath;
- memset(newpath, 0, sizeof(struct ext4_extent_path));
-}
+ /* Increment the extent pointer to point to the
+ * next extent. */
+ ret = ext4_extent_increment(inode_ref, path, &nonext);
+ if (ret != EOK)
+ goto out;
-int ext4_ext_insert_extent(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path **ppath,
- struct ext4_extent *newext, int flags)
-{
- int depth, level = 0, ret;
- struct ext4_extent_path *path = *ppath;
- struct ext4_extent_path *npath = NULL;
- bool ins_right_leaf = false;
- bool need_split;
+ /* The current extent is already the last extent in
+ * the tree, so we just return success here. */
+ if (nonext)
+ goto out;
+ } else if (fromiblock > startiblock) {
+ bool unwritten;
+ uint16_t len;
-again:
- depth = ext_depth(inode_ref->inode);
- ret = ext4_ext_insert_leaf(inode_ref, path, depth, newext, flags,
- &need_split);
- if (ret == EIO && need_split == true) {
- int i;
- for (i = depth, level = 0; i >= 0; i--, level++)
- if (EXT_HAS_FREE_INDEX(path + i))
- break;
+ /* @fromiblock is in the range of the current extent,
+ * but does not sit right on the starting block.
+ *
+ * In this case we need to modify the current extent.
+ * and free some blocks, since we do not really want
+ * to remove and reinsert a new one. */
- /* Do we need to grow the tree? */
- if (i < 0) {
- ret = ext4_ext_grow_indepth(inode_ref, 0);
- if (ret != EOK)
- goto out;
+ len = fromiblock - startiblock;
+ unwritten = EXT4_EXT_IS_UNWRITTEN(ext);
+ ext4_extent_set_nblocks(ext, len, unwritten);
- ret = ext4_find_extent(
- inode_ref, to_le32(newext->first_block), ppath, 0);
- if (ret != EOK)
- goto out;
+ ext4_extent_path_dirty(inode_ref, path, p->depth);
- path = *ppath;
- /*
- * After growing the tree, there should be free space in
- * the only child node of the root.
- */
- level--;
- depth++;
- }
+ /* Free the range of blocks starting from @fromiblock
+ * up to either @endiblock or @toiblock. */
+ if (toiblock < endiblock) {
+ uint16_t flen;
+ ext4_fsblk_t blocknr;
+ struct ext4_extent next;
- i = depth - (level - 1);
- /* We split from leaf to the i-th node */
- if (level > 0) {
- npath = ext4_calloc(1, sizeof(struct ext4_extent_path) *
- (level));
- if (!npath) {
- ret = ENOMEM;
- goto out;
- }
- ret = ext4_ext_split_node(inode_ref, path, i, newext,
- npath, &ins_right_leaf);
- if (ret != EOK)
- goto out;
+ /* In case we free up space inside an extent
+ * while not touching both ends, we need to
+ * unavoidably insert a new extent right after
+ * the modified current extent, and that may
+ * cause tree splitting. */
- while (--level >= 0) {
- if (ins_right_leaf)
- ext4_ext_replace_path(inode_ref, path,
- &npath[level],
- i + level);
- else if (npath[level].block.lb_id)
- ext4_ext_drop_refs(inode_ref,
- npath + level, 1);
- }
- }
- goto again;
- }
+ /* Now we need to free up space first. */
+ flen = toiblock - fromiblock + 1;
+ blocknr = ext4_extent_get_fblock(ext) + len;
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Freeing: %" PRIu64 ":%" PRIu16 "\n",
+ blocknr, flen);
+ ext4_balloc_free_blocks(inode_ref, blocknr, flen);
-out:
- if (ret != EOK) {
- if (path)
- ext4_ext_drop_refs(inode_ref, path, 0);
+ blocknr += flen;
+ startiblock = fromiblock + flen;
+ len = endiblock - startiblock + 1;
- while (--level >= 0 && npath) {
- if (npath[level].block.lb_id) {
- ext4_fsblk_t block = npath[level].block.lb_id;
- ext4_ext_free_blocks(inode_ref, block, 1, 0);
- ext4_ext_drop_refs(inode_ref, npath + level, 1);
- }
- }
- }
- if (npath)
- ext4_free(npath);
+ ext4_extent_set_iblock(&next, startiblock);
+ ext4_extent_set_nblocks(&next, len, unwritten);
+ ext4_extent_set_fblock(&next, blocknr);
+ ret = ext4_extent_insert(inode_ref, path, &next);
- return ret;
-}
+ /* After we free up the space and insert a new
+ * extent, we are done. */
+ goto out;
+ } else {
+ bool nonext;
+ uint16_t flen;
+ ext4_fsblk_t blocknr;
-static void ext4_ext_remove_blocks(struct ext4_inode_ref *inode_ref,
- struct ext4_extent *ex, ext4_lblk_t from,
- ext4_lblk_t to)
-{
- ext4_lblk_t len = to - from + 1;
- ext4_lblk_t num;
- ext4_fsblk_t start;
- num = from - to_le32(ex->first_block);
- start = ext4_ext_pblock(ex) + num;
- ext4_dbg(DEBUG_EXTENT,
- "Freeing %" PRIu32 " at %" PRIu64 ", %" PRIu32 "\n", from,
- start, len);
+ /* Otherwise we do not need any insertion,
+ * which also means that no extra space may be
+ * allocated for tree splitting. */
+ flen = endiblock - fromiblock + 1;
+ blocknr = ext4_extent_get_fblock(ext) + len;
- ext4_ext_free_blocks(inode_ref, start, len, 0);
-}
+ /* Now we need to free up space first. */
+ ext4_dbg(DEBUG_EXTENT,
+ DBG_INFO "Freeing: %" PRIu64 ":%" PRIu16 "\n",
+ blocknr, flen);
+ ext4_balloc_free_blocks(inode_ref, blocknr, flen);
-static int ext4_ext_remove_idx(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, int32_t depth)
-{
- int err;
- int32_t i = depth;
- ext4_fsblk_t leaf;
-
- /* free index block */
- leaf = ext4_idx_pblock(path[i].index);
-
- if (path[i].index != EXT_LAST_INDEX(path[i].header)) {
- ptrdiff_t len = EXT_LAST_INDEX(path[i].header) - path[i].index;
- memmove(path[i].index, path[i].index + 1,
- len * sizeof(struct ext4_extent_index));
+ /* Increment the extent pointer to point to the
+ * next extent. */
+ ret = ext4_extent_increment(inode_ref, path, &nonext);
+ if (ret != EOK || nonext)
+ goto out;
+ }
}
- path[i].header->entries_count =
- to_le16(to_le16(path[i].header->entries_count) - 1);
- err = ext4_ext_dirty(inode_ref, path + i);
- if (err != EOK)
- return err;
+ while (p <= path + rootdepth) {
+ struct ext4_extent_path *chldp;
- ext4_dbg(DEBUG_EXTENT, "IDX: Freeing %" PRIu32 " at %" PRIu64 ", %d\n",
- to_le32(path[i].index->first_block), leaf, 1);
- ext4_ext_free_blocks(inode_ref, leaf, 1, 0);
+ hdr = p->header;
- /*
- * We may need to correct the paths after the first extents/indexes in
- * a node being modified.
- *
- * We do not need to consider whether there's any extents presenting or
- * not, as garbage will be cleared soon.
- */
- while (i > 0) {
- if (path[i].index != EXT_FIRST_INDEX(path[i].header))
- break;
+ if (!p->depth) {
+ bool stop;
- path[i - 1].index->first_block = path[i].index->first_block;
- err = ext4_ext_dirty(inode_ref, path + i - 1);
- if (err != EOK)
- break;
+ /* Delete as much extents as we can. */
+ ret = ext4_extent_delete_leaf(inode_ref,
+ path,
+ toiblock,
+ &stop);
+ if (ret != EOK)
+ goto out;
- i--;
- }
- return err;
-}
+ if (stop) {
+ /* Since the current extent has its logical
+ * block number greater than @toiblock,
+ * we are done. */
+ break;
+ }
+ /* Since there are no more items in the leaf,
+ * we have to go one level above to switch to the
+ * next leaf. */
+ p++;
+ continue;
+ }
-static int ext4_ext_remove_leaf(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path *path, ext4_lblk_t from,
- ext4_lblk_t to)
-{
+ chldp = p - 1;
+ nitems = ext4_extent_header_get_nentries(chldp->header);
- int32_t depth = ext_depth(inode_ref->inode);
- struct ext4_extent *ex = path[depth].extent;
- struct ext4_extent *start_ex, *ex2 = NULL;
- struct ext4_extent_header *eh = path[depth].header;
- int32_t len;
- int err = EOK;
- uint16_t new_entries;
+ /* Now we don't need the children path anymore. */
+ ext4_block_set(inode_ref->fs->bdev, &chldp->block);
+ if (!nitems) {
+ ret = ext4_extent_delete_node(inode_ref, path, p->depth);
+ if (ret != EOK)
+ goto out;
- start_ex = ex;
- new_entries = to_le16(eh->entries_count);
- while (ex <= EXT_LAST_EXTENT(path[depth].header) &&
- to_le32(ex->first_block) <= to) {
- int32_t new_len = 0;
- int unwritten;
- ext4_lblk_t start, new_start;
- ext4_fsblk_t newblock;
- new_start = start = to_le32(ex->first_block);
- len = ext4_ext_get_actual_len(ex);
- newblock = ext4_ext_pblock(ex);
- /*
- * The 1st case:
- * The position that we start truncation is inside the range of an
- * extent. Here we should calculate the new length of that extent and
- * may start the removal from the next extent.
- */
- if (start < from) {
- len -= from - start;
- new_len = from - start;
- start = from;
- start_ex++;
+ if (p->index > EXT4_EXTENT_LAST_INDEX(hdr)) {
+ /* Go one level above */
+ p++;
+ } else {
+ ret = ext4_extent_reload_paths(inode_ref, path, p->depth, false);
+ if (ret != EOK)
+ goto out;
+ /* Go to the bottom level (aka the leaf). */
+ p = path;
+ }
} else {
- /*
- * The second case:
- * The last block to be truncated is inside the range of an
- * extent. We need to calculate the new length and the new
- * start of the extent.
- */
- if (start + len - 1 > to) {
- new_len = start + len - 1 - to;
- len -= new_len;
- new_start = to + 1;
- newblock += to + 1 - start;
- ex2 = ex;
+ if (p->index == EXT4_EXTENT_LAST_INDEX(hdr)) {
+ /* Go one level above */
+ p++;
+ } else {
+ p->index++;
+ ret = ext4_extent_reload_paths(inode_ref, path, p->depth, false);
+ if (ret != EOK)
+ goto out;
+ /* Go to the bottom level (aka the leaf). */
+ p = path;
}
}
+ }
- ext4_ext_remove_blocks(inode_ref, ex, start, start + len - 1);
- /*
- * Set the first block of the extent if it is presented.
- */
- ex->first_block = to_le32(new_start);
+ /* The above code can only exit in either situations:
+ *
+ * 1. We found that there is no more extents at the right
+ * (p < path)
+ * 2. We found that the next extent has key larger than @toiblock
+ * (p at leaf) */
+ ext4_assert(p == path || p > path + rootdepth);
+ if (p == path) {
+ /* We might have removed the leftmost key in the node,
+ * so we need to update the first key of the right
+ * sibling at every level until we meet a non-leftmost
+ * key. */
+ ext4_extent_update_index(inode_ref, path, true);
+ } else {
+ /* Put loaded blocks. We won't double-release
+ * in this case since the depth of tree will
+ * be reset to 0. */
+ ext4_extent_path_release(inode_ref, path);
- /*
- * If the new length of the current extent we are working on is
- * zero, remove it.
- */
- if (!new_len)
- new_entries--;
- else {
- unwritten = ext4_ext_is_unwritten(ex);
- ex->block_count = to_le16(new_len);
- ext4_ext_store_pblock(ex, newblock);
- if (unwritten)
- ext4_ext_mark_unwritten(ex);
+ hdr = ext4_inode_get_extent_header(inode_ref->inode);
+ if (!ext4_extent_header_get_nentries(hdr)) {
+ /* For empty root we need to make sure that the
+ * depth of the root level is 0. */
+ ext4_extent_header_set_nentries(hdr, 0);
+ ext4_extent_header_set_depth(hdr, 0);
+ inode_ref->dirty = true;
}
-
- ex += 1;
}
- if (ex2 == NULL)
- ex2 = ex;
+out:
+ /* Put loaded blocks */
+ ext4_extent_path_release(inode_ref, path);
- /*
- * Move any remaining extents to the starting position of the node.
- */
- if (ex2 <= EXT_LAST_EXTENT(eh))
- memmove(start_ex, ex2, (EXT_LAST_EXTENT(eh) - ex2 + 1) *
- sizeof(struct ext4_extent));
+ /* Destroy temporary data structure */
+ ext4_free(path);
- eh->entries_count = to_le16(new_entries);
- ext4_ext_dirty(inode_ref, path + depth);
-
- /*
- * If the extent pointer is pointed to the first extent of the node, and
- * there's still extents presenting, we may need to correct the indexes
- * of the paths.
- */
- if (path[depth].extent == EXT_FIRST_EXTENT(eh) && eh->entries_count) {
- err = ext4_ext_correct_indexes(inode_ref, path);
- if (err != EOK)
- return err;
- }
-
- /* if this leaf is free, then we should
- * remove it from index block above */
- if (eh->entries_count == 0 && path[depth].block.lb_id)
- err = ext4_ext_remove_idx(inode_ref, path, depth - 1);
- else if (depth > 0)
- path[depth - 1].index++;
-
- return err;
+ return ret;
}
-/*
- * Check if there's more to remove at a specific level.
- */
-static bool ext4_ext_more_to_rm(struct ext4_extent_path *path, ext4_lblk_t to)
+/**@brief Zero a range of blocks
+ * @param inode_ref I-node
+ * @param fblock starting block number to be zeroed
+ * @param nblocks number of blocks to be zeroed
+ * @return Error code */
+static int ext4_extent_zero_fblocks(struct ext4_inode_ref *inode_ref,
+ ext4_fsblk_t fblock,
+ ext4_lblk_t nblocks)
{
- if (!to_le16(path->header->entries_count))
- return false;
+ int ret = EOK;
+ ext4_lblk_t i;
+ uint32_t blocksz;
- if (path->index > EXT_LAST_INDEX(path->header))
- return false;
+ blocksz = ext4_sb_get_block_size(&inode_ref->fs->sb);
+ for (i = 0; i < nblocks; i++) {
+ struct ext4_block bh = EXT4_BLOCK_ZERO();
+ ret = ext4_trans_block_get_noread(inode_ref->fs->bdev, &bh,
+ fblock + i);
+ if (ret != EOK)
+ break;
- if (to_le32(path->index->first_block) > to)
- return false;
-
- return true;
+ memset(bh.data, 0, blocksz);
+ ext4_trans_set_block_dirty(bh.buf);
+ ret = ext4_block_set(inode_ref->fs->bdev, &bh);
+ if (ret != EOK)
+ break;
+ }
+ return ret;
}
-int ext4_extent_remove_space(struct ext4_inode_ref *inode_ref, ext4_lblk_t from,
- ext4_lblk_t to)
+/**@brief Convert unwritten mapping to written one
+ * @param inode_ref I-node
+ * @param path Path in the extent tree
+ * @param iblock starting logical block to be converted
+ * @param nblocks number of blocks to be converted
+ * @return Error code */
+int ext4_extent_convert_written(struct ext4_inode_ref *inode_ref,
+ struct ext4_extent_path *path,
+ ext4_lblk_t iblock,
+ ext4_lblk_t nblocks)
{
- struct ext4_extent_path *path = NULL;
int ret;
- int32_t depth = ext_depth(inode_ref->inode);
- int32_t i;
+ ext4_lblk_t eiblock;
+ ext4_lblk_t enblocks;
+ ext4_fsblk_t efblock;
+ struct ext4_extent *ext;
- ret = ext4_find_extent(inode_ref, from, &path, 0);
- if (ret != EOK)
- goto out;
+ ext = path[0].extent;
+ ext4_assert(ext);
- if (!path[depth].extent) {
- ret = EOK;
- goto out;
- }
+ eiblock = ext4_extent_get_iblock(ext);
+ enblocks = ext4_extent_get_nblocks(ext);
+ efblock = ext4_extent_get_fblock(ext);
+ ext4_assert(EXT4_EXTENT_IN_RANGE(iblock, eiblock, enblocks));
- bool in_range = IN_RANGE(from, to_le32(path[depth].extent->first_block),
- ext4_ext_get_actual_len(path[depth].extent));
+ /* There are four cases we need to handle */
+ if (iblock == eiblock && nblocks == enblocks) {
+ /* Case 1: the whole extent has to be converted.
+ * This is the simplest scenario. We just need
+ * to mark the extent "written", and zero the
+ * blocks covered by the extent */
+ ret = ext4_extent_zero_fblocks(inode_ref, efblock, enblocks);
+ if (ret != EOK)
+ return ret;
+ EXT4_EXT_SET_WRITTEN(ext);
+ ext4_extent_path_dirty(inode_ref, path, 0);
+ } else if (iblock == eiblock) {
+ /* Case 2: convert the first part of the extent to written
+ * and insert an unwritten extent after that */
+ ext4_lblk_t newiblock;
+ ext4_lblk_t newnblocks;
+ ext4_fsblk_t newfblock;
+ struct ext4_extent insext;
- if (!in_range) {
- ret = EOK;
- goto out;
- }
+ /* The new extent we are going to insert */
+ newiblock = eiblock + nblocks;
+ newnblocks = eiblock + enblocks - newiblock;
+ newfblock = efblock + nblocks;
- /* If we do remove_space inside the range of an extent */
- if ((to_le32(path[depth].extent->first_block) < from) &&
- (to < to_le32(path[depth].extent->first_block) +
- ext4_ext_get_actual_len(path[depth].extent) - 1)) {
+ /* Zero the blocks covered by the first part of the extent */
+ ret = ext4_extent_zero_fblocks(inode_ref,
+ efblock + iblock - eiblock,
+ nblocks);
+ if (ret != EOK)
+ return ret;
- struct ext4_extent *ex = path[depth].extent, newex;
- int unwritten = ext4_ext_is_unwritten(ex);
- ext4_lblk_t ee_block = to_le32(ex->first_block);
- int32_t len = ext4_ext_get_actual_len(ex);
- ext4_fsblk_t newblock = to + 1 - ee_block + ext4_ext_pblock(ex);
+ /* Trim the current extent and convert the extent to written */
+ ext4_extent_set_nblocks(ext, enblocks - nblocks, false);
+ ext4_extent_path_dirty(inode_ref, path, 0);
- ex->block_count = to_le16(from - ee_block);
- if (unwritten)
- ext4_ext_mark_unwritten(ex);
+ /* Insert the new extent */
+ ext4_extent_set_iblock(&insext, newiblock);
+ ext4_extent_set_nblocks(&insext, newnblocks, true);
+ ext4_extent_set_fblock(&insext, newfblock);
+ ret = ext4_extent_insert(inode_ref, path, &insext);
+ if (ret != EOK)
+ /* In case when something happens during insertion
+ * we revert the trimming of the current extent */
+ ext4_extent_set_nblocks(ext, nblocks, true);
+ } else if (iblock + nblocks == eiblock + enblocks) {
+ /* Case 3: convert the second part of the extent to written.
+ * We insert an written extent after the current extent */
+ ext4_lblk_t newiblock;
+ ext4_lblk_t newnblocks;
+ ext4_fsblk_t newfblock;
+ struct ext4_extent insext;
- ext4_ext_dirty(inode_ref, path + depth);
+ /* The new extent we are going to insert */
+ newiblock = iblock;
+ newnblocks = nblocks;
+ newfblock = efblock + iblock - eiblock;
- newex.first_block = to_le32(to + 1);
- newex.block_count = to_le16(ee_block + len - 1 - to);
- ext4_ext_store_pblock(&newex, newblock);
- if (unwritten)
- ext4_ext_mark_unwritten(&newex);
+ /* Zero the blocks covered by the first part of the extent */
+ ret = ext4_extent_zero_fblocks(inode_ref, newfblock, newnblocks);
+ if (ret != EOK)
+ return ret;
- ret = ext4_ext_insert_extent(inode_ref, &path, &newex, 0);
- goto out;
- }
+ /* Trim the current extent */
+ ext4_extent_set_nblocks(ext, enblocks - nblocks, true);
+ ext4_extent_path_dirty(inode_ref, path, 0);
- i = depth;
- while (i >= 0) {
- if (i == depth) {
- struct ext4_extent_header *eh;
- struct ext4_extent *first_ex, *last_ex;
- ext4_lblk_t leaf_from, leaf_to;
- eh = path[i].header;
- ext4_assert(to_le16(eh->entries_count) > 0);
- first_ex = EXT_FIRST_EXTENT(eh);
- last_ex = EXT_LAST_EXTENT(eh);
- leaf_from = to_le32(first_ex->first_block);
- leaf_to = to_le32(last_ex->first_block) +
- ext4_ext_get_actual_len(last_ex) - 1;
- if (leaf_from < from)
- leaf_from = from;
+ /* Insert the new extent */
+ ext4_extent_set_iblock(&insext, newiblock);
+ ext4_extent_set_nblocks(&insext, newnblocks, false);
+ ext4_extent_set_fblock(&insext, newfblock);
+ ret = ext4_extent_insert(inode_ref, path, &insext);
+ if (ret != EOK)
+ /* In case when something happens during insertion
+ * we revert the trimming of the current extent */
+ ext4_extent_set_nblocks(ext, nblocks, true);
+ } else {
+ /* Case 4: convert the middle part of the extent to written.
+ * We insert one written extent, follow by an unwritten
+ * extent */
+ ext4_lblk_t newiblock[2];
+ ext4_lblk_t newnblocks[2];
+ ext4_fsblk_t newfblock[2];
+ struct ext4_extent insext;
- if (leaf_to > to)
- leaf_to = to;
+ /* The new extents we are going to insert */
+ newiblock[0] = iblock;
+ newnblocks[0] = nblocks;
+ newfblock[0] = efblock + iblock - eiblock;
+ newiblock[1] = iblock + nblocks;
+ newnblocks[1] = eiblock + enblocks - newiblock[1];
+ newfblock[1] = newfblock[0] + nblocks;
- ext4_ext_remove_leaf(inode_ref, path, leaf_from,
- leaf_to);
- ext4_ext_drop_refs(inode_ref, path + i, 0);
- i--;
- continue;
- }
+ /* Zero the blocks covered by the written extent */
+ ret = ext4_extent_zero_fblocks(inode_ref, newfblock[0],
+ newnblocks[0]);
+ if (ret != EOK)
+ return ret;
- struct ext4_extent_header *eh;
- eh = path[i].header;
- if (ext4_ext_more_to_rm(path + i, to)) {
- struct ext4_block bh = EXT4_BLOCK_ZERO();
- if (path[i + 1].block.lb_id)
- ext4_ext_drop_refs(inode_ref, path + i + 1, 0);
+ /* We don't want to fail in the middle because we
+ * run out of space. From now on the subsequent
+ * insertions cannot fail */
+ ret = ext4_extent_split(inode_ref, path, 2);
+ if (ret != EOK)
+ return ret;
- ret = read_extent_tree_block(
- inode_ref, ext4_idx_pblock(path[i].index),
- depth - i - 1, &bh, 0);
- if (ret != EOK)
- goto out;
+ /* Trim the current extent */
+ ext4_extent_set_nblocks(ext,
+ enblocks - newnblocks[0] - newnblocks[1],
+ true);
+ ext4_extent_path_dirty(inode_ref, path, 0);
- path[i].p_block = ext4_idx_pblock(path[i].index);
- path[i + 1].block = bh;
- path[i + 1].header = ext_block_hdr(&bh);
- path[i + 1].depth = depth - i - 1;
- if (i + 1 == depth)
- path[i + 1].extent =
- EXT_FIRST_EXTENT(path[i + 1].header);
- else
- path[i + 1].index =
- EXT_FIRST_INDEX(path[i + 1].header);
+ /* Insert the written extent first */
+ ext4_extent_set_iblock(&insext, newiblock[0]);
+ ext4_extent_set_nblocks(&insext, newnblocks[0], false);
+ ext4_extent_set_fblock(&insext, newfblock[0]);
+ ret = ext4_extent_insert(inode_ref, path, &insext);
+ ext4_assert(ret == EOK);
- i++;
- } else {
- if (i > 0) {
- /*
- * Garbage entries will finally be cleared here.
- */
- if (!eh->entries_count)
- ret = ext4_ext_remove_idx(inode_ref,
- path, i - 1);
- else
- path[i - 1].index++;
- }
-
- if (i)
- ext4_block_set(inode_ref->fs->bdev,
- &path[i].block);
-
- i--;
- }
+ /* Then insert the unwritten extent */
+ ext4_extent_set_iblock(&insext, newiblock[1]);
+ ext4_extent_set_nblocks(&insext , newnblocks[1], true);
+ ext4_extent_set_fblock(&insext, newfblock[1]);
+ ret = ext4_extent_insert(inode_ref, path, &insext);
+ ext4_assert(ret == EOK);
}
-
- /* TODO: flexible tree reduction should be here */
- if (path->header->entries_count == 0) {
- /*
- * truncate to zero freed all the tree,
- * so we need to correct eh_depth
- */
- ext_inode_hdr(inode_ref->inode)->depth = 0;
- ext_inode_hdr(inode_ref->inode)->max_entries_count =
- to_le16(ext4_ext_space_root(inode_ref));
- ret = ext4_ext_dirty(inode_ref, path);
- }
-
-out:
- ext4_ext_drop_refs(inode_ref, path, 0);
- ext4_free(path);
- path = NULL;
return ret;
}
-static int ext4_ext_split_extent_at(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path **ppath,
- ext4_lblk_t split, uint32_t split_flag)
+/**@brief Check if the second extent can be appended to the first extent
+ * @param ext the first extent
+ * @param ext2 the second extent
+ * @return true if the two extents can be merged, otherwise false */
+static bool ext4_extent_can_append(struct ext4_extent *ext,
+ struct ext4_extent *ext2)
{
- struct ext4_extent *ex, newex;
- ext4_fsblk_t newblock;
- ext4_lblk_t ee_block;
- int32_t ee_len;
- int32_t depth = ext_depth(inode_ref->inode);
- int err;
+ bool unwritten;
+ ext4_lblk_t eiblock[2];
+ ext4_lblk_t enblocks[2];
+ ext4_fsblk_t efblock[2];
- ex = (*ppath)[depth].extent;
- ee_block = to_le32(ex->first_block);
- ee_len = ext4_ext_get_actual_len(ex);
- newblock = split - ee_block + ext4_ext_pblock(ex);
+ eiblock[0] = ext4_extent_get_iblock(ext);
+ enblocks[0] = ext4_extent_get_nblocks(ext);
+ efblock[0] = ext4_extent_get_fblock(ext);
+ eiblock[1] = ext4_extent_get_iblock(ext2);
+ enblocks[1] = ext4_extent_get_nblocks(ext2);
+ efblock[1] = ext4_extent_get_fblock(ext2);
- if (split == ee_block) {
- /*
- * case b: block @split is the block that the extent begins with
- * then we just change the state of the extent, and splitting
- * is not needed.
- */
- if (split_flag & EXT4_EXT_MARK_UNWRIT2)
- ext4_ext_mark_unwritten(ex);
- else
- ext4_ext_mark_initialized(ex);
+ /* We can't merge an unwritten extent with a written
+ * extent */
+ if (EXT4_EXT_IS_UNWRITTEN(ext) != EXT4_EXT_IS_UNWRITTEN(ext2))
+ return false;
- err = ext4_ext_dirty(inode_ref, *ppath + depth);
- goto out;
+ unwritten = EXT4_EXT_IS_UNWRITTEN(ext);
+
+ /* Since the starting logical block of the second
+ * extent is greater than that of the first extent,
+ * we check whether we can append the second extent
+ * to the first extent */
+ if (eiblock[0] + enblocks[0] != eiblock[1] ||
+ efblock[0] + enblocks[0] != efblock[1])
+ /* If the two extents are not continuous
+ * in terms of logical block range and
+ * physical block range, we return false */
+ return false;
+
+ /* Check if the total number of blocks of the two extents are
+ * too long.
+ * Note: the maximum length of unwritten extent is shorter than
+ * written extent by one block */
+ if (unwritten) {
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ if (enblocks[0] + enblocks[1] > 3)
+#else /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ if (enblocks[0] + enblocks[1] > EXT4_EXT_MAX_LEN_UNWRITTEN)
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ return false;
+ } else {
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ if (enblocks[0] + enblocks[1] > 3)
+#else /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ if (enblocks[0] + enblocks[1] > EXT4_EXT_MAX_LEN_WRITTEN)
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ return false;
}
- ex->block_count = to_le16(split - ee_block);
- if (split_flag & EXT4_EXT_MARK_UNWRIT1)
- ext4_ext_mark_unwritten(ex);
+ /* The second extent can be appended to the first extent */
+ return true;
+}
- err = ext4_ext_dirty(inode_ref, *ppath + depth);
- if (err != EOK)
- goto out;
+/**@brief Check if the second extent can be prepended to the first extent
+ * @param ext the first extent
+ * @param ext2 the second extent
+ * @return true if the two extents can be merged, otherwise false */
+static bool ext4_extent_can_prepend(struct ext4_extent *ext,
+ struct ext4_extent *ext2)
+{
+ bool unwritten;
+ ext4_lblk_t eiblock[2];
+ ext4_lblk_t enblocks[2];
+ ext4_fsblk_t efblock[2];
- newex.first_block = to_le32(split);
- newex.block_count = to_le16(ee_len - (split - ee_block));
- ext4_ext_store_pblock(&newex, newblock);
- if (split_flag & EXT4_EXT_MARK_UNWRIT2)
- ext4_ext_mark_unwritten(&newex);
- err = ext4_ext_insert_extent(inode_ref, ppath, &newex,
- EXT4_EXT_NO_COMBINE);
- if (err != EOK)
- goto restore_extent_len;
+ eiblock[0] = ext4_extent_get_iblock(ext);
+ enblocks[0] = ext4_extent_get_nblocks(ext);
+ efblock[0] = ext4_extent_get_fblock(ext);
+ eiblock[1] = ext4_extent_get_iblock(ext2);
+ enblocks[1] = ext4_extent_get_nblocks(ext2);
+ efblock[1] = ext4_extent_get_fblock(ext2);
-out:
- return err;
-restore_extent_len:
- ex->block_count = to_le16(ee_len);
- err = ext4_ext_dirty(inode_ref, *ppath + depth);
- return err;
-}
+ /* We can't merge an unwritten extent with a written
+ * extent */
+ if (EXT4_EXT_IS_UNWRITTEN(ext) != EXT4_EXT_IS_UNWRITTEN(ext2))
+ return false;
-static int ext4_ext_convert_to_initialized(struct ext4_inode_ref *inode_ref,
- struct ext4_extent_path **ppath,
- ext4_lblk_t split, uint32_t blocks)
-{
- int32_t depth = ext_depth(inode_ref->inode), err;
- struct ext4_extent *ex = (*ppath)[depth].extent;
+ unwritten = EXT4_EXT_IS_UNWRITTEN(ext);
- ext4_assert(to_le32(ex->first_block) <= split);
+ /* Since the starting logical block of the second
+ * extent is smaller than that of the first extent,
+ * we check whether we can prepend the second extent
+ * to the first extent */
+ if (eiblock[1] + enblocks[1] != eiblock[0] ||
+ efblock[1] + enblocks[1] != efblock[0])
+ /* If the two extents are not continuous
+ * in terms of logical block range and
+ * physical block range, we return false */
+ return false;
- if (split + blocks ==
- to_le32(ex->first_block) + ext4_ext_get_actual_len(ex)) {
- /* split and initialize right part */
- err = ext4_ext_split_extent_at(inode_ref, ppath, split,
- EXT4_EXT_MARK_UNWRIT1);
- } else if (to_le32(ex->first_block) == split) {
- /* split and initialize left part */
- err = ext4_ext_split_extent_at(inode_ref, ppath, split + blocks,
- EXT4_EXT_MARK_UNWRIT2);
+ /* Check if the total number of blocks of the two extents are
+ * too long.
+ * Note: the maximum length of unwritten extent is shorter than
+ * written extent by one block */
+ if (unwritten) {
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ if (enblocks[0] + enblocks[1] > 3)
+#else /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ if (enblocks[0] + enblocks[1] > EXT4_EXT_MAX_LEN_UNWRITTEN)
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ return false;
} else {
- /* split 1 extent to 3 and initialize the 2nd */
- err = ext4_ext_split_extent_at(inode_ref, ppath, split + blocks,
- EXT4_EXT_MARK_UNWRIT1 |
- EXT4_EXT_MARK_UNWRIT2);
- if (err == EOK) {
- err = ext4_ext_split_extent_at(inode_ref, ppath, split,
- EXT4_EXT_MARK_UNWRIT1);
- }
+#if CONFIG_EXTENT_DEBUG_AGGRESSIVE
+ if (enblocks[0] + enblocks[1] > 3)
+#else /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ if (enblocks[0] + enblocks[1] > EXT4_EXT_MAX_LEN_WRITTEN)
+#endif /* CONFIG_EXTENT_DEBUG_AGGRESSIVE */
+ return false;
}
- return err;
+ /* The second extent can be prepended to the first extent */
+ return true;
}
-static ext4_lblk_t ext4_ext_next_allocated_block(struct ext4_extent_path *path)
+/**@brief Allocate multiple number of blocks
+ * @param inode_ref I-node
+ * @param goal physical block allocation hint
+ * @param nblocks number of blocks to be allocated
+ * @param fblockp Output value - starting physical block number
+ * @param nblocksp Output value - the number of blocks allocated
+ * @return Error code */
+static int
+ext4_extent_alloc_datablocks(struct ext4_inode_ref *inode_ref,
+ ext4_fsblk_t goal,
+ ext4_lblk_t nblocks,
+ ext4_fsblk_t *fblockp,
+ ext4_lblk_t *nblocksp)
{
- int32_t depth;
+ int ret = EOK;
+ ext4_lblk_t i;
+ ext4_fsblk_t retfblock;
+ ext4_lblk_t retnblocks = 0;
- depth = path->depth;
+ for (i = 0; i < nblocks; ++i, ++retnblocks) {
+ bool free = false;
- if (depth == 0 && path->extent == NULL)
- return EXT_MAX_BLOCKS;
-
- while (depth >= 0) {
- if (depth == path->depth) {
- /* leaf */
- if (path[depth].extent &&
- path[depth].extent !=
- EXT_LAST_EXTENT(path[depth].header))
- return to_le32(
- path[depth].extent[1].first_block);
+ if (!i) {
+ /* We allocate the first block by using
+ * ext4_balloc_alloc_block() so that we
+ * can pass allocation hint to the block
+ * allocator */
+ ret = ext4_balloc_alloc_block(inode_ref,
+ goal,
+ &retfblock);
+ if (ret == EOK)
+ free = true;
} else {
- /* index */
- if (path[depth].index !=
- EXT_LAST_INDEX(path[depth].header))
- return to_le32(
- path[depth].index[1].first_block);
+ ext4_fsblk_t blockscnt;
+
+ /* Do a check to make sure that we won't look into
+ * a block number larger than the total number of
+ * blocks we have on this filesystem */
+ blockscnt = ext4_sb_get_blocks_cnt(&inode_ref->fs->sb);
+ if (retfblock + i < blockscnt) {
+ ret = ext4_balloc_try_alloc_block(inode_ref,
+ retfblock + i, &free);
+ } else
+ free = false;
}
- depth--;
- }
- return EXT_MAX_BLOCKS;
-}
-
-static int ext4_ext_zero_unwritten_range(struct ext4_inode_ref *inode_ref,
- ext4_fsblk_t block,
- uint32_t blocks_count)
-{
- int err = EOK;
- uint32_t i;
- uint32_t block_size = ext4_sb_get_block_size(&inode_ref->fs->sb);
- for (i = 0; i < blocks_count; i++) {
- struct ext4_block bh = EXT4_BLOCK_ZERO();
- err = ext4_trans_block_get_noread(inode_ref->fs->bdev, &bh,
- block + i);
- if (err != EOK)
+ /* Stop trying on the next block if we encounter errors, or
+ * if there is insufficient space, or if we can't allocate
+ * blocks continuously */
+ if (ret != EOK || !free)
break;
-
- memset(bh.data, 0, block_size);
- ext4_trans_set_block_dirty(bh.buf);
- err = ext4_block_set(inode_ref->fs->bdev, &bh);
- if (err != EOK)
- break;
}
- return err;
-}
-__unused static void print_path(struct ext4_extent_path *path)
-{
- int32_t i = path->depth;
- while (i >= 0) {
-
- ptrdiff_t a =
- (path->extent)
- ? (path->extent - EXT_FIRST_EXTENT(path->header))
- : 0;
- ptrdiff_t b =
- (path->index)
- ? (path->index - EXT_FIRST_INDEX(path->header))
- : 0;
-
- USED(a);
- USED(b);
- ext4_dbg(DEBUG_EXTENT,
- "depth %" PRId32 ", p_block: %" PRIu64 ","
- "p_ext offset: %td, p_idx offset: %td\n",
- i, path->p_block, a, b);
- i--;
- path++;
+ if (ret == EOK) {
+ *fblockp = retfblock;
+ if (nblocksp)
+ *nblocksp = nblocks;
}
+ return ret;
}
-int ext4_extent_get_blocks(struct ext4_inode_ref *inode_ref, ext4_lblk_t iblock,
- uint32_t max_blocks, ext4_fsblk_t *result,
- bool create, uint32_t *blocks_count)
+/**@brief Extent-based blockmap manipulation
+ * @param inode_ref I-node
+ * @param iblock starting logical block of the inode
+ * @param max_nblocks maximum number of blocks to get from/allocate to blockmap
+ * @param resfblockp return physical block address of the first block of an
+ * extent
+ * @param create true if caller wants to insert mapping or convert
+ * unwritten mapping to written one
+ * @param resnblocksp return number of blocks in an extent (must be smaller than
+ * \p max_nblocks)
+ * @return Error code*/
+int ext4_extent_get_blocks(struct ext4_inode_ref *inode_ref,
+ ext4_lblk_t iblock,
+ ext4_lblk_t max_nblocks,
+ ext4_fsblk_t *resfblockp,
+ bool create,
+ ext4_lblk_t *resnblocksp)
{
- struct ext4_extent_path *path = NULL;
- struct ext4_extent newex, *ex;
+ int ret;
+ struct ext4_extent_path *path;
+ struct ext4_extent *ext;
+ struct ext4_extent insext;
+ ext4_lblk_t eiblock;
+ ext4_lblk_t enblocks;
+ ext4_fsblk_t efblock;
+ ext4_fsblk_t resfblock;
+ ext4_lblk_t resnblocks = 0;
ext4_fsblk_t goal;
- int err = EOK;
- int32_t depth;
- uint32_t allocated = 0;
- ext4_lblk_t next;
- ext4_fsblk_t newblock;
- if (result)
- *result = 0;
+ /* Seek to the corresponding extent */
+ ret = ext4_extent_find_extent(inode_ref, iblock, &path);
+ if (ret != EOK)
+ return ret;
- if (blocks_count)
- *blocks_count = 0;
+ ext = path[0].extent;
+ if (ext) {
+ /* The extent tree is not empty */
+ eiblock = ext4_extent_get_iblock(ext);
+ enblocks = ext4_extent_get_nblocks(ext);
+ efblock = ext4_extent_get_fblock(ext);
+ if (EXT4_EXTENT_IN_RANGE(iblock, eiblock, enblocks)) {
+ /* The extent exists and logical block requested falls
+ * into the range of the extent */
+ resfblock = efblock + iblock - eiblock;
+ resnblocks = eiblock + enblocks - iblock;
- /* find extent for this block */
- err = ext4_find_extent(inode_ref, iblock, &path, 0);
- if (err != EOK) {
- path = NULL;
- goto out2;
- }
+ /* Trim the result if it is larger than the maximum
+ * length the caller wants */
+ if (resnblocks > max_nblocks)
+ resnblocks = max_nblocks;
- depth = ext_depth(inode_ref->inode);
-
- /*
- * consistent leaf must not be empty
- * this situations is possible, though, _during_ tree modification
- * this is why assert can't be put in ext4_ext_find_extent()
- */
- ex = path[depth].extent;
- if (ex) {
- ext4_lblk_t ee_block = to_le32(ex->first_block);
- ext4_fsblk_t ee_start = ext4_ext_pblock(ex);
- uint16_t ee_len = ext4_ext_get_actual_len(ex);
- /* if found exent covers block, simple return it */
- if (IN_RANGE(iblock, ee_block, ee_len)) {
- /* number of remain blocks in the extent */
- allocated = ee_len - (iblock - ee_block);
-
- if (!ext4_ext_is_unwritten(ex)) {
- newblock = iblock - ee_block + ee_start;
- goto out;
+ if (EXT4_EXT_IS_UNWRITTEN(ext)) {
+ if (create)
+ /* Convert the extent to written extent
+ * if the extent is unwritten extent */
+ ret = ext4_extent_convert_written(inode_ref,
+ path,
+ iblock,
+ resnblocks);
+ else
+ /* We are not asked to modify the blockmap
+ * so we just return a hole */
+ resfblock = 0;
}
+ goto cleanup;
+ }
+ if (!create) {
+ /* Don't waste time on finding the next extent if we
+ * are not asked to insert mapping, just return a
+ * hole */
+ resfblock = 0;
+ resnblocks = 1;
+ goto cleanup;
+ }
+ if (ext4_extent_get_iblock(ext) < iblock) {
+ /* Since the logical block of current extent is smaller
+ * the requested logical block, we seek to the next
+ * extent to find the maximum number of blocks we can
+ * allocate without hitting the starting logical block
+ * of the next extent */
+ bool nonext;
- if (!create) {
- newblock = 0;
- goto out;
- }
+ /* Go to the next extent */
+ ret = ext4_extent_increment(inode_ref, path, &nonext);
+ if (ret != EOK)
+ goto cleanup;
- uint32_t zero_range;
- zero_range = allocated;
- if (zero_range > max_blocks)
- zero_range = max_blocks;
+ if (!nonext) {
+ /* We successfully reach the next extent */
+ bool noprev;
+ ext4_lblk_t neiblock;
- newblock = iblock - ee_block + ee_start;
- err = ext4_ext_zero_unwritten_range(inode_ref, newblock,
- zero_range);
- if (err != EOK)
- goto out2;
+ ext = path[0].extent;
- err = ext4_ext_convert_to_initialized(
- inode_ref, &path, iblock, zero_range);
- if (err != EOK)
- goto out2;
+ /* The next extent must start at greater logical
+ * block number */
+ ext4_assert(ext4_extent_get_iblock(ext) >
+ iblock);
- goto out;
+ /* Calculate the maximum number of blocks we
+ * can allocate without overlapping with the
+ * next extent */
+ neiblock = ext4_extent_get_iblock(ext);
+ if (max_nblocks > neiblock - iblock)
+ max_nblocks = neiblock - iblock;
+
+ /* Go back to the previous extent */
+ ret = ext4_extent_decrement(inode_ref, path,
+ &noprev);
+ if (ret != EOK)
+ goto cleanup;
+ ext4_assert(!noprev);
+ ext = path[0].extent;
+ }
}
}
- /*
- * requested block isn't allocated yet
- * we couldn't try to create block if create flag is zero
- */
+ /* Return a hole if we are not asked to insert mapping */
if (!create) {
- goto out2;
+ resfblock = 0;
+ resnblocks = 1;
+ goto cleanup;
}
- /* find next allocated block so that we know how many
- * blocks we can allocate without ovelapping next extent */
- next = ext4_ext_next_allocated_block(path);
- allocated = next - iblock;
- if (allocated > max_blocks)
- allocated = max_blocks;
+ /* Multiple data blocks allocation */
+ goal = ext4_extent_data_alloc_goal(inode_ref, path, iblock);
+ ret = ext4_extent_alloc_datablocks(inode_ref, goal, max_nblocks,
+ &resfblock, &max_nblocks);
+ if (ret != EOK)
+ goto cleanup;
- /* allocate new block */
- goal = ext4_ext_find_goal(inode_ref, path, iblock);
- newblock = ext4_new_meta_blocks(inode_ref, goal, 0, &allocated, &err);
- if (!newblock)
- goto out2;
+ ext4_extent_set_iblock(&insext, iblock);
+ ext4_extent_set_nblocks(&insext, max_nblocks, false);
+ ext4_extent_set_fblock(&insext, resfblock);
- /* try to insert new extent into found leaf and return */
- newex.first_block = to_le32(iblock);
- ext4_ext_store_pblock(&newex, newblock);
- newex.block_count = to_le16(allocated);
- err = ext4_ext_insert_extent(inode_ref, &path, &newex, 0);
- if (err != EOK) {
- /* free data blocks we just allocated */
- ext4_ext_free_blocks(inode_ref, ext4_ext_pblock(&newex),
- to_le16(newex.block_count), 0);
- goto out2;
- }
+ if (ext && ext4_extent_can_append(ext, &insext)) {
+ /* Clang won't complain, it's just to make gcc happy */
+ enblocks = ext4_extent_get_nblocks(ext);
- /* previous routine could use block we allocated */
- newblock = ext4_ext_pblock(&newex);
+ /* If we can append this extent to the current extent */
+ ext4_extent_set_nblocks(ext, enblocks + max_nblocks,
+ EXT4_EXT_IS_UNWRITTEN(ext));
-out:
- if (allocated > max_blocks)
- allocated = max_blocks;
+ ext4_extent_path_dirty(inode_ref, path, 0);
+ } else if (ext && ext4_extent_can_prepend(ext, &insext)) {
+ /* Clang won't complain, it's just to make gcc happy */
+ enblocks = ext4_extent_get_nblocks(ext);
- if (result)
- *result = newblock;
+ /* If we can prepend this extent to the current extent */
+ ext4_extent_set_iblock(ext, iblock);
+ ext4_extent_set_nblocks(ext, enblocks + max_nblocks,
+ EXT4_EXT_IS_UNWRITTEN(ext));
+ ext4_extent_set_fblock(ext, resfblock);
- if (blocks_count)
- *blocks_count = allocated;
+ /* If we are working on the first extent in the
+ * first leaf (in case we are actually prepending
+ * mappings) we need to update the index of nodes.
+ *
+ * NOTE: Since we don't seek to the next extent and
+ * try to modify it, prepending should not happen at
+ * any leaves except the first extent of the first leaf */
+ ext4_extent_update_index(inode_ref, path, false);
+ ext4_extent_path_dirty(inode_ref, path, 0);
+ } else {
+ /* Finally, insert a new extent into the extent tree */
+ ret = ext4_extent_insert(inode_ref, path, &insext);
+ if (ret != EOK)
+ ext4_balloc_free_blocks(inode_ref, resfblock,
+ max_nblocks);
+ }
-out2:
- if (path) {
- ext4_ext_drop_refs(inode_ref, path, 0);
- ext4_free(path);
+ resnblocks = max_nblocks;
+
+cleanup:
+ /* Put loaded blocks */
+ ext4_extent_path_release(inode_ref, path);
+
+ /* Destroy temporary data structure */
+ ext4_free(path);
+
+ if (ret == EOK) {
+ if (resfblockp)
+ *resfblockp = resfblock;
+ if (resnblocksp)
+ *resnblocksp = resnblocks;
}
- return err;
+ return ret;
}
-#endif
+
+#endif /* CONFIG_EXTENT_ENABLE */
+
+/**
+ * @}
+ */
--- a/src/ext4_fs.c
+++ b/src/ext4_fs.c
@@ -1231,7 +1231,7 @@
/* Extents require special operation */
if (diff_blocks_cnt) {
r = ext4_extent_remove_space(inode_ref, new_blocks_cnt,
- EXT_MAX_BLOCKS);
+ EXT4_EXTENT_MAX_BLOCKS);
if (r != EOK)
return r;