Commit 887ff81a authored by Andreas Gruenbacher's avatar Andreas Gruenbacher Committed by Linus Torvalds

[PATCH] ext3/EA: In-inode extended attributes for ext3

This started of as a patch by Alex Tomas <alex@clusterfs.com> and got an
overhaul by me.  The on-disk structure used is the same as in Alex's
original patch.
Signed-off-by: default avatarAndreas Gruenbacher <agruen@suse.de>
Signed-off-by: default avatarAndrew Morton <akpm@osdl.org>
Signed-off-by: default avatarLinus Torvalds <torvalds@osdl.org>
parent 7fada86f
...@@ -596,6 +596,9 @@ struct inode *ext3_new_inode(handle_t *handle, struct inode * dir, int mode) ...@@ -596,6 +596,9 @@ struct inode *ext3_new_inode(handle_t *handle, struct inode * dir, int mode)
spin_unlock(&sbi->s_next_gen_lock); spin_unlock(&sbi->s_next_gen_lock);
ei->i_state = EXT3_STATE_NEW; ei->i_state = EXT3_STATE_NEW;
ei->i_extra_isize =
(EXT3_INODE_SIZE(inode->i_sb) > EXT3_GOOD_OLD_INODE_SIZE) ?
sizeof(struct ext3_inode) - EXT3_GOOD_OLD_INODE_SIZE : 0;
ret = inode; ret = inode;
if(DQUOT_ALLOC_INODE(inode)) { if(DQUOT_ALLOC_INODE(inode)) {
......
...@@ -2385,7 +2385,9 @@ static int __ext3_get_inode_loc(struct inode *inode, ...@@ -2385,7 +2385,9 @@ static int __ext3_get_inode_loc(struct inode *inode,
int ext3_get_inode_loc(struct inode *inode, struct ext3_iloc *iloc) int ext3_get_inode_loc(struct inode *inode, struct ext3_iloc *iloc)
{ {
return __ext3_get_inode_loc(inode, iloc, 1); /* We have all inode data except xattrs in memory here. */
return __ext3_get_inode_loc(inode, iloc,
!(EXT3_I(inode)->i_state & EXT3_STATE_XATTR));
} }
void ext3_set_inode_flags(struct inode *inode) void ext3_set_inode_flags(struct inode *inode)
...@@ -2491,6 +2493,16 @@ void ext3_read_inode(struct inode * inode) ...@@ -2491,6 +2493,16 @@ void ext3_read_inode(struct inode * inode)
ei->i_data[block] = raw_inode->i_block[block]; ei->i_data[block] = raw_inode->i_block[block];
INIT_LIST_HEAD(&ei->i_orphan); INIT_LIST_HEAD(&ei->i_orphan);
ei->i_extra_isize =
(EXT3_INODE_SIZE(inode->i_sb) > EXT3_GOOD_OLD_INODE_SIZE) ?
le16_to_cpu(raw_inode->i_extra_isize) : 0;
if (ei->i_extra_isize) {
__le32 *magic = (void *)raw_inode + EXT3_GOOD_OLD_INODE_SIZE +
ei->i_extra_isize;
if (le32_to_cpu(*magic))
ei->i_state |= EXT3_STATE_XATTR;
}
if (S_ISREG(inode->i_mode)) { if (S_ISREG(inode->i_mode)) {
inode->i_op = &ext3_file_inode_operations; inode->i_op = &ext3_file_inode_operations;
inode->i_fop = &ext3_file_operations; inode->i_fop = &ext3_file_operations;
...@@ -2626,6 +2638,9 @@ static int ext3_do_update_inode(handle_t *handle, ...@@ -2626,6 +2638,9 @@ static int ext3_do_update_inode(handle_t *handle,
} else for (block = 0; block < EXT3_N_BLOCKS; block++) } else for (block = 0; block < EXT3_N_BLOCKS; block++)
raw_inode->i_block[block] = ei->i_data[block]; raw_inode->i_block[block] = ei->i_data[block];
if (EXT3_INODE_SIZE(inode->i_sb) > EXT3_GOOD_OLD_INODE_SIZE)
raw_inode->i_extra_isize = cpu_to_le16(ei->i_extra_isize);
BUFFER_TRACE(bh, "call ext3_journal_dirty_metadata"); BUFFER_TRACE(bh, "call ext3_journal_dirty_metadata");
rc = ext3_journal_dirty_metadata(handle, bh); rc = ext3_journal_dirty_metadata(handle, bh);
if (!err) if (!err)
......
...@@ -9,18 +9,21 @@ ...@@ -9,18 +9,21 @@
* suggestion of Luka Renko <luka.renko@hermes.si>. * suggestion of Luka Renko <luka.renko@hermes.si>.
* xattr consolidation Copyright (c) 2004 James Morris <jmorris@redhat.com>, * xattr consolidation Copyright (c) 2004 James Morris <jmorris@redhat.com>,
* Red Hat Inc. * Red Hat Inc.
* ea-in-inode support by Alex Tomas <alex@clusterfs.com> aka bzzz
* and Andreas Gruenbacher <agruen@suse.de>.
*/ */
/* /*
* Extended attributes are stored on disk blocks allocated outside of * Extended attributes are stored directly in inodes (on file systems with
* any inode. The i_file_acl field is then made to point to this allocated * inodes bigger than 128 bytes) and on additional disk blocks. The i_file_acl
* block. If all extended attributes of an inode are identical, these * field contains the block number if an inode uses an additional block. All
* inodes may share the same extended attribute block. Such situations * attributes must fit in the inode and one additional block. Blocks that
* are automatically detected by keeping a cache of recent attribute block * contain the identical set of attributes may be shared among several inodes.
* numbers and hashes over the block's contents in memory. * Identical blocks are detected by keeping a cache of blocks that have
* recently been accessed.
* *
* * The attributes in inodes and on blocks have a different header; the entries
* Extended attribute block layout: * are stored in the same format:
* *
* +------------------+ * +------------------+
* | header | * | header |
...@@ -34,23 +37,17 @@ ...@@ -34,23 +37,17 @@
* | value 2 | | * | value 2 | |
* +------------------+ * +------------------+
* *
* The block header is followed by multiple entry descriptors. These entry * The header is followed by multiple entry descriptors. Descriptors are
* descriptors are variable in size, and alligned to EXT3_XATTR_PAD * kept sorted. The attribute values are aligned to the end of the block
* byte boundaries. The entry descriptors are sorted by attribute name, * in no specific order.
* so that two extended attribute blocks can be compared efficiently.
*
* Attribute values are aligned to the end of the block, stored in
* no specific order. They are also padded to EXT3_XATTR_PAD byte
* boundaries. No additional gaps are left between them.
* *
* Locking strategy * Locking strategy
* ---------------- * ----------------
* EXT3_I(inode)->i_file_acl is protected by EXT3_I(inode)->xattr_sem. * EXT3_I(inode)->i_file_acl is protected by EXT3_I(inode)->xattr_sem.
* EA blocks are only changed if they are exclusive to an inode, so * EA blocks are only changed if they are exclusive to an inode, so
* holding xattr_sem also means that nothing but the EA block's reference * holding xattr_sem also means that nothing but the EA block's reference
* count will change. Multiple writers to an EA block are synchronized * count can change. Multiple writers to the same block are synchronized
* by the bh lock. No more than a single bh lock is held at any time * by the buffer lock.
* to avoid deadlocks.
*/ */
#include <linux/init.h> #include <linux/init.h>
...@@ -69,6 +66,13 @@ ...@@ -69,6 +66,13 @@
#define BFIRST(bh) ENTRY(BHDR(bh)+1) #define BFIRST(bh) ENTRY(BHDR(bh)+1)
#define IS_LAST_ENTRY(entry) (*(__u32 *)(entry) == 0) #define IS_LAST_ENTRY(entry) (*(__u32 *)(entry) == 0)
#define IHDR(inode, raw_inode) \
((struct ext3_xattr_ibody_header *) \
((void *)raw_inode + \
EXT3_GOOD_OLD_INODE_SIZE + \
EXT3_I(inode)->i_extra_isize))
#define IFIRST(hdr) ((struct ext3_xattr_entry *)((hdr)+1))
#ifdef EXT3_XATTR_DEBUG #ifdef EXT3_XATTR_DEBUG
# define ea_idebug(inode, f...) do { \ # define ea_idebug(inode, f...) do { \
printk(KERN_DEBUG "inode %s:%ld: ", \ printk(KERN_DEBUG "inode %s:%ld: ", \
...@@ -206,19 +210,9 @@ ext3_xattr_find_entry(struct ext3_xattr_entry **pentry, int name_index, ...@@ -206,19 +210,9 @@ ext3_xattr_find_entry(struct ext3_xattr_entry **pentry, int name_index,
return cmp ? -ENODATA : 0; return cmp ? -ENODATA : 0;
} }
/*
* ext3_xattr_get()
*
* Copy an extended attribute into the buffer
* provided, or compute the buffer size required.
* Buffer is NULL to compute the size of the buffer required.
*
* Returns a negative error number on failure, or the number of bytes
* used / required on success.
*/
int int
ext3_xattr_get(struct inode *inode, int name_index, const char *name, ext3_xattr_block_get(struct inode *inode, int name_index, const char *name,
void *buffer, size_t buffer_size) void *buffer, size_t buffer_size)
{ {
struct buffer_head *bh = NULL; struct buffer_head *bh = NULL;
struct ext3_xattr_entry *entry; struct ext3_xattr_entry *entry;
...@@ -228,9 +222,6 @@ ext3_xattr_get(struct inode *inode, int name_index, const char *name, ...@@ -228,9 +222,6 @@ ext3_xattr_get(struct inode *inode, int name_index, const char *name,
ea_idebug(inode, "name=%d.%s, buffer=%p, buffer_size=%ld", ea_idebug(inode, "name=%d.%s, buffer=%p, buffer_size=%ld",
name_index, name, buffer, (long)buffer_size); name_index, name, buffer, (long)buffer_size);
if (name == NULL)
return -EINVAL;
down_read(&EXT3_I(inode)->xattr_sem);
error = -ENODATA; error = -ENODATA;
if (!EXT3_I(inode)->i_file_acl) if (!EXT3_I(inode)->i_file_acl)
goto cleanup; goto cleanup;
...@@ -266,6 +257,75 @@ bad_block: ext3_error(inode->i_sb, __FUNCTION__, ...@@ -266,6 +257,75 @@ bad_block: ext3_error(inode->i_sb, __FUNCTION__,
cleanup: cleanup:
brelse(bh); brelse(bh);
return error;
}
static int
ext3_xattr_ibody_get(struct inode *inode, int name_index, const char *name,
void *buffer, size_t buffer_size)
{
struct ext3_xattr_ibody_header *header;
struct ext3_xattr_entry *entry;
struct ext3_inode *raw_inode;
struct ext3_iloc iloc;
size_t size;
void *end;
int error;
if (EXT3_SB(inode->i_sb)->s_inode_size <= EXT3_GOOD_OLD_INODE_SIZE ||
!(EXT3_I(inode)->i_state & EXT3_STATE_XATTR))
return -ENODATA;
error = ext3_get_inode_loc(inode, &iloc);
if (error)
return error;
raw_inode = ext3_raw_inode(&iloc);
header = IHDR(inode, raw_inode);
entry = IFIRST(header);
end = (void *)raw_inode + EXT3_SB(inode->i_sb)->s_inode_size;
error = ext3_xattr_check_names(entry, end);
if (error)
goto cleanup;
error = ext3_xattr_find_entry(&entry, name_index, name,
end - (void *)entry, 0);
if (error)
goto cleanup;
size = le32_to_cpu(entry->e_value_size);
if (buffer) {
error = -ERANGE;
if (size > buffer_size)
goto cleanup;
memcpy(buffer, (void *)IFIRST(header) +
le16_to_cpu(entry->e_value_offs), size);
}
error = size;
cleanup:
brelse(iloc.bh);
return error;
}
/*
* ext3_xattr_get()
*
* Copy an extended attribute into the buffer
* provided, or compute the buffer size required.
* Buffer is NULL to compute the size of the buffer required.
*
* Returns a negative error number on failure, or the number of bytes
* used / required on success.
*/
int
ext3_xattr_get(struct inode *inode, int name_index, const char *name,
void *buffer, size_t buffer_size)
{
int error;
down_read(&EXT3_I(inode)->xattr_sem);
error = ext3_xattr_ibody_get(inode, name_index, name, buffer,
buffer_size);
if (error == -ENODATA)
error = ext3_xattr_block_get(inode, name_index, name, buffer,
buffer_size);
up_read(&EXT3_I(inode)->xattr_sem); up_read(&EXT3_I(inode)->xattr_sem);
return error; return error;
} }
...@@ -295,18 +355,8 @@ ext3_xattr_list_entries(struct inode *inode, struct ext3_xattr_entry *entry, ...@@ -295,18 +355,8 @@ ext3_xattr_list_entries(struct inode *inode, struct ext3_xattr_entry *entry,
return buffer_size - rest; return buffer_size - rest;
} }
/*
* ext3_xattr_list()
*
* Copy a list of attribute names into the buffer
* provided, or compute the buffer size required.
* Buffer is NULL to compute the size of the buffer required.
*
* Returns a negative error number on failure, or the number of bytes
* used / required on success.
*/
int int
ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size) ext3_xattr_block_list(struct inode *inode, char *buffer, size_t buffer_size)
{ {
struct buffer_head *bh = NULL; struct buffer_head *bh = NULL;
int error; int error;
...@@ -314,7 +364,6 @@ ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size) ...@@ -314,7 +364,6 @@ ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size)
ea_idebug(inode, "buffer=%p, buffer_size=%ld", ea_idebug(inode, "buffer=%p, buffer_size=%ld",
buffer, (long)buffer_size); buffer, (long)buffer_size);
down_read(&EXT3_I(inode)->xattr_sem);
error = 0; error = 0;
if (!EXT3_I(inode)->i_file_acl) if (!EXT3_I(inode)->i_file_acl)
goto cleanup; goto cleanup;
...@@ -337,11 +386,71 @@ ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size) ...@@ -337,11 +386,71 @@ ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size)
cleanup: cleanup:
brelse(bh); brelse(bh);
up_read(&EXT3_I(inode)->xattr_sem);
return error; return error;
} }
static int
ext3_xattr_ibody_list(struct inode *inode, char *buffer, size_t buffer_size)
{
struct ext3_xattr_ibody_header *header;
struct ext3_inode *raw_inode;
struct ext3_iloc iloc;
void *end;
int error;
if (EXT3_SB(inode->i_sb)->s_inode_size <= EXT3_GOOD_OLD_INODE_SIZE ||
!(EXT3_I(inode)->i_state & EXT3_STATE_XATTR))
return 0;
error = ext3_get_inode_loc(inode, &iloc);
if (error)
return error;
raw_inode = ext3_raw_inode(&iloc);
header = IHDR(inode, raw_inode);
end = (void *)raw_inode + EXT3_SB(inode->i_sb)->s_inode_size;
error = ext3_xattr_check_names(IFIRST(header), end);
if (error)
goto cleanup;
error = ext3_xattr_list_entries(inode, IFIRST(header),
buffer, buffer_size);
cleanup:
brelse(iloc.bh);
return error;
}
/*
* ext3_xattr_list()
*
* Copy a list of attribute names into the buffer
* provided, or compute the buffer size required.
* Buffer is NULL to compute the size of the buffer required.
*
* Returns a negative error number on failure, or the number of bytes
* used / required on success.
*/
int
ext3_xattr_list(struct inode *inode, char *buffer, size_t buffer_size)
{
int i_error, b_error;
down_read(&EXT3_I(inode)->xattr_sem);
i_error = ext3_xattr_ibody_list(inode, buffer, buffer_size);
if (i_error < 0) {
b_error = 0;
} else {
if (buffer) {
buffer += i_error;
buffer_size -= i_error;
}
b_error = ext3_xattr_block_list(inode, buffer, buffer_size);
if (b_error < 0)
i_error = 0;
}
up_read(&EXT3_I(inode)->xattr_sem);
return i_error + b_error;
}
/* /*
* If the EXT3_FEATURE_COMPAT_EXT_ATTR feature of this file system is * If the EXT3_FEATURE_COMPAT_EXT_ATTR feature of this file system is
* not set, set it. * not set, set it.
...@@ -514,175 +623,146 @@ ext3_xattr_set_entry(struct ext3_xattr_info *i, struct ext3_xattr_search *s) ...@@ -514,175 +623,146 @@ ext3_xattr_set_entry(struct ext3_xattr_info *i, struct ext3_xattr_search *s)
return 0; return 0;
} }
/* struct ext3_xattr_block_find {
* ext3_xattr_set_handle() struct ext3_xattr_search s;
* struct buffer_head *bh;
* Create, replace or remove an extended attribute for this inode. Buffer };
* is NULL to remove an existing extended attribute, and non-NULL to
* either replace an existing extended attribute, or create a new extended
* attribute. The flags XATTR_REPLACE and XATTR_CREATE
* specify that an extended attribute must exist and must not exist
* previous to the call, respectively.
*
* Returns 0, or a negative error number on failure.
*/
int int
ext3_xattr_set_handle(handle_t *handle, struct inode *inode, int name_index, ext3_xattr_block_find(struct inode *inode, struct ext3_xattr_info *i,
const char *name, const void *value, size_t value_len, struct ext3_xattr_block_find *bs)
int flags)
{ {
struct super_block *sb = inode->i_sb; struct super_block *sb = inode->i_sb;
struct buffer_head *old_bh = NULL, *new_bh = NULL;
struct ext3_xattr_info i = {
.name_index = name_index,
.name = name,
.value = value,
.value_len = value_len,
};
struct ext3_xattr_search s = {
.not_found = 1,
};
struct mb_cache_entry *ce = NULL;
int error; int error;
#define header ((struct ext3_xattr_header *)(s.base))
/*
* header -- Points either into bh, or to a temporarily
* allocated buffer.
*/
ea_idebug(inode, "name=%d.%s, value=%p, value_len=%ld", ea_idebug(inode, "name=%d.%s, value=%p, value_len=%ld",
name_index, name, value, (long)value_len); i->name_index, i->name, i->value, (long)i->value_len);
if (IS_RDONLY(inode))
return -EROFS;
if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
return -EPERM;
if (i.value == NULL)
i.value_len = 0;
down_write(&EXT3_I(inode)->xattr_sem);
if (EXT3_I(inode)->i_file_acl) { if (EXT3_I(inode)->i_file_acl) {
/* The inode already has an extended attribute block. */ /* The inode already has an extended attribute block. */
old_bh = sb_bread(sb, EXT3_I(inode)->i_file_acl); bs->bh = sb_bread(sb, EXT3_I(inode)->i_file_acl);
error = -EIO; error = -EIO;
if (!old_bh) if (!bs->bh)
goto cleanup; goto cleanup;
ea_bdebug(old_bh, "b_count=%d, refcount=%d", ea_bdebug(bs->bh, "b_count=%d, refcount=%d",
atomic_read(&(old_bh->b_count)), atomic_read(&(bs->bh->b_count)),
le32_to_cpu(BHDR(old_bh)->h_refcount)); le32_to_cpu(BHDR(bs->bh)->h_refcount));
if (ext3_xattr_check_block(old_bh)) { if (ext3_xattr_check_block(bs->bh)) {
bad_block: ext3_error(sb, __FUNCTION__, ext3_error(sb, __FUNCTION__,
"inode %ld: bad block %d", inode->i_ino, "inode %ld: bad block %d", inode->i_ino,
EXT3_I(inode)->i_file_acl); EXT3_I(inode)->i_file_acl);
error = -EIO; error = -EIO;
goto cleanup; goto cleanup;
} }
/* Find the named attribute. */ /* Find the named attribute. */
s.base = BHDR(old_bh); bs->s.base = BHDR(bs->bh);
s.first = BFIRST(old_bh); bs->s.first = BFIRST(bs->bh);
s.end = old_bh->b_data + old_bh->b_size; bs->s.end = bs->bh->b_data + bs->bh->b_size;
s.here = BFIRST(old_bh); bs->s.here = bs->s.first;
error = ext3_xattr_find_entry(&s.here, name_index, name, error = ext3_xattr_find_entry(&bs->s.here, i->name_index,
old_bh->b_size, 1); i->name, bs->bh->b_size, 1);
if (error && error != -ENODATA) if (error && error != -ENODATA)
goto cleanup; goto cleanup;
s.not_found = error; bs->s.not_found = error;
} }
error = 0;
if (s.not_found) { cleanup:
/* Request to remove a nonexistent attribute? */ return error;
error = -ENODATA; }
if (flags & XATTR_REPLACE)
goto cleanup; static int
error = 0; ext3_xattr_block_set(handle_t *handle, struct inode *inode,
if (value == NULL) struct ext3_xattr_info *i,
goto cleanup; struct ext3_xattr_block_find *bs)
} else { {
/* Request to create an existing attribute? */ struct super_block *sb = inode->i_sb;
error = -EEXIST; struct buffer_head *new_bh = NULL;
if (flags & XATTR_CREATE) struct ext3_xattr_search *s = &bs->s;
goto cleanup; struct mb_cache_entry *ce = NULL;
} int error;
if (header) { #define header(x) ((struct ext3_xattr_header *)(x))
/* assert(header == BHDR(old_bh)); */
ce = mb_cache_entry_get(ext3_xattr_cache, old_bh->b_bdev, if (i->value && i->value_len > sb->s_blocksize)
old_bh->b_blocknr); return -ENOSPC;
if (header->h_refcount == cpu_to_le32(1)) { if (s->base) {
ce = mb_cache_entry_get(ext3_xattr_cache, bs->bh->b_bdev,
bs->bh->b_blocknr);
if (header(s->base)->h_refcount == cpu_to_le32(1)) {
if (ce) { if (ce) {
mb_cache_entry_free(ce); mb_cache_entry_free(ce);
ce = NULL; ce = NULL;
} }
ea_bdebug(old_bh, "modifying in-place"); ea_bdebug(bs->bh, "modifying in-place");
error = ext3_journal_get_write_access(handle, old_bh); error = ext3_journal_get_write_access(handle, bs->bh);
if (error) if (error)
goto cleanup; goto cleanup;
lock_buffer(old_bh); lock_buffer(bs->bh);
error = ext3_xattr_set_entry(&i, &s); error = ext3_xattr_set_entry(i, s);
if (!error) { if (!error) {
if (!IS_LAST_ENTRY(s.first)) if (!IS_LAST_ENTRY(s->first))
ext3_xattr_rehash(header, s.here); ext3_xattr_rehash(header(s->base),
ext3_xattr_cache_insert(old_bh); s->here);
ext3_xattr_cache_insert(bs->bh);
} }
unlock_buffer(old_bh); unlock_buffer(bs->bh);
if (error == -EIO) if (error == -EIO)
goto bad_block; goto bad_block;
if (!error && old_bh && header == BHDR(old_bh)) { if (!error)
error = ext3_journal_dirty_metadata(handle, error = ext3_journal_dirty_metadata(handle,
old_bh); bs->bh);
}
if (error) if (error)
goto cleanup; goto cleanup;
goto inserted; goto inserted;
} else { } else {
int offset = (char *)s.here - old_bh->b_data; int offset = (char *)s->here - bs->bh->b_data;
if (ce) { if (ce) {
mb_cache_entry_release(ce); mb_cache_entry_release(ce);
ce = NULL; ce = NULL;
} }
ea_bdebug(old_bh, "cloning"); ea_bdebug(bs->bh, "cloning");
s.base = kmalloc(old_bh->b_size, GFP_KERNEL); s->base = kmalloc(bs->bh->b_size, GFP_KERNEL);
/*assert(header == s.base)*/
error = -ENOMEM; error = -ENOMEM;
if (header == NULL) if (s->base == NULL)
goto cleanup; goto cleanup;
memcpy(header, BHDR(old_bh), old_bh->b_size); memcpy(s->base, BHDR(bs->bh), bs->bh->b_size);
s.first = ENTRY(header+1); s->first = ENTRY(header(s->base)+1);
header->h_refcount = cpu_to_le32(1); header(s->base)->h_refcount = cpu_to_le32(1);
s.here = ENTRY(s.base + offset); s->here = ENTRY(s->base + offset);
s.end = header + old_bh->b_size; s->end = s->base + bs->bh->b_size;
} }
} else { } else {
/* Allocate a buffer where we construct the new block. */ /* Allocate a buffer where we construct the new block. */
s.base = kmalloc(sb->s_blocksize, GFP_KERNEL); s->base = kmalloc(sb->s_blocksize, GFP_KERNEL);
/*assert(header == s.base)*/ /* assert(header == s->base) */
error = -ENOMEM; error = -ENOMEM;
if (header == NULL) if (s->base == NULL)
goto cleanup; goto cleanup;
memset(header, 0, sb->s_blocksize); memset(s->base, 0, sb->s_blocksize);
header->h_magic = cpu_to_le32(EXT3_XATTR_MAGIC); header(s->base)->h_magic = cpu_to_le32(EXT3_XATTR_MAGIC);
header->h_blocks = header->h_refcount = cpu_to_le32(1); header(s->base)->h_blocks = cpu_to_le32(1);
s.first = ENTRY(header+1); header(s->base)->h_refcount = cpu_to_le32(1);
s.here = ENTRY(header+1); s->first = ENTRY(header(s->base)+1);
s.end = (void *)header + sb->s_blocksize; s->here = ENTRY(header(s->base)+1);
s->end = s->base + sb->s_blocksize;
} }
error = ext3_xattr_set_entry(&i, &s); error = ext3_xattr_set_entry(i, s);
if (error == -EIO) if (error == -EIO)
goto bad_block; goto bad_block;
if (error) if (error)
goto cleanup; goto cleanup;
if (!IS_LAST_ENTRY(s.first)) if (!IS_LAST_ENTRY(s->first))
ext3_xattr_rehash(header, s.here); ext3_xattr_rehash(header(s->base), s->here);
inserted: inserted:
if (!IS_LAST_ENTRY(s.first)) { if (!IS_LAST_ENTRY(s->first)) {
new_bh = ext3_xattr_cache_find(inode, header, &ce); new_bh = ext3_xattr_cache_find(inode, header(s->base), &ce);
if (new_bh) { if (new_bh) {
/* We found an identical block in the cache. */ /* We found an identical block in the cache. */
if (new_bh == old_bh) if (new_bh == bs->bh)
ea_bdebug(new_bh, "keeping"); ea_bdebug(new_bh, "keeping");
else { else {
/* The old block is released after updating /* The old block is released after updating
...@@ -690,7 +770,8 @@ bad_block: ext3_error(sb, __FUNCTION__, ...@@ -690,7 +770,8 @@ bad_block: ext3_error(sb, __FUNCTION__,
error = -EDQUOT; error = -EDQUOT;
if (DQUOT_ALLOC_BLOCK(inode, 1)) if (DQUOT_ALLOC_BLOCK(inode, 1))
goto cleanup; goto cleanup;
error = ext3_journal_get_write_access(handle, new_bh); error = ext3_journal_get_write_access(handle,
new_bh);
if (error) if (error)
goto cleanup; goto cleanup;
lock_buffer(new_bh); lock_buffer(new_bh);
...@@ -706,10 +787,10 @@ bad_block: ext3_error(sb, __FUNCTION__, ...@@ -706,10 +787,10 @@ bad_block: ext3_error(sb, __FUNCTION__,
} }
mb_cache_entry_release(ce); mb_cache_entry_release(ce);
ce = NULL; ce = NULL;
} else if (old_bh && header == BHDR(old_bh)) { } else if (bs->bh && s->base == bs->bh->b_data) {
/* We were modifying this block in-place. */ /* We were modifying this block in-place. */
ea_bdebug(old_bh, "keeping this block"); ea_bdebug(bs->bh, "keeping this block");
new_bh = old_bh; new_bh = bs->bh;
get_bh(new_bh); get_bh(new_bh);
} else { } else {
/* We need to allocate a new block */ /* We need to allocate a new block */
...@@ -735,7 +816,7 @@ bad_block: ext3_error(sb, __FUNCTION__, ...@@ -735,7 +816,7 @@ bad_block: ext3_error(sb, __FUNCTION__,
unlock_buffer(new_bh); unlock_buffer(new_bh);
goto getblk_failed; goto getblk_failed;
} }
memcpy(new_bh->b_data, header, new_bh->b_size); memcpy(new_bh->b_data, s->base, new_bh->b_size);
set_buffer_uptodate(new_bh); set_buffer_uptodate(new_bh);
unlock_buffer(new_bh); unlock_buffer(new_bh);
ext3_xattr_cache_insert(new_bh); ext3_xattr_cache_insert(new_bh);
...@@ -748,30 +829,196 @@ bad_block: ext3_error(sb, __FUNCTION__, ...@@ -748,30 +829,196 @@ bad_block: ext3_error(sb, __FUNCTION__,
/* Update the inode. */ /* Update the inode. */
EXT3_I(inode)->i_file_acl = new_bh ? new_bh->b_blocknr : 0; EXT3_I(inode)->i_file_acl = new_bh ? new_bh->b_blocknr : 0;
inode->i_ctime = CURRENT_TIME_SEC;
ext3_mark_inode_dirty(handle, inode);
if (IS_SYNC(inode))
handle->h_sync = 1;
/* Drop the previous xattr block. */ /* Drop the previous xattr block. */
if (old_bh && old_bh != new_bh) if (bs->bh && bs->bh != new_bh)
ext3_xattr_release_block(handle, inode, old_bh); ext3_xattr_release_block(handle, inode, bs->bh);
error = 0; error = 0;
cleanup: cleanup:
if (ce) if (ce)
mb_cache_entry_release(ce); mb_cache_entry_release(ce);
brelse(new_bh); brelse(new_bh);
brelse(old_bh); if (!(bs->bh && s->base == bs->bh->b_data))
if (!(old_bh && header == BHDR(old_bh))) kfree(s->base);
kfree(header);
up_write(&EXT3_I(inode)->xattr_sem);
return error; return error;
bad_block:
ext3_error(inode->i_sb, __FUNCTION__,
"inode %ld: bad block %d", inode->i_ino,
EXT3_I(inode)->i_file_acl);
goto cleanup;
#undef header #undef header
} }
struct ext3_xattr_ibody_find {
struct ext3_xattr_search s;
struct ext3_iloc iloc;
};
int
ext3_xattr_ibody_find(struct inode *inode, struct ext3_xattr_info *i,
struct ext3_xattr_ibody_find *is)
{
struct ext3_xattr_ibody_header *header;
struct ext3_inode *raw_inode;
int error;
if (EXT3_SB(inode->i_sb)->s_inode_size <= EXT3_GOOD_OLD_INODE_SIZE)
return 0;
raw_inode = ext3_raw_inode(&is->iloc);
header = IHDR(inode, raw_inode);
is->s.base = is->s.first = IFIRST(header);
is->s.here = is->s.first;
is->s.end = (void *)raw_inode + EXT3_SB(inode->i_sb)->s_inode_size;
if (EXT3_I(inode)->i_state & EXT3_STATE_XATTR) {
error = ext3_xattr_check_names(IFIRST(header), is->s.end);
if (error)
return error;
/* Find the named attribute. */
error = ext3_xattr_find_entry(&is->s.here, i->name_index,
i->name, is->s.end -
(void *)is->s.base, 0);
if (error && error != -ENODATA)
return error;
is->s.not_found = error;
}
return 0;
}
static int
ext3_xattr_ibody_set(handle_t *handle, struct inode *inode,
struct ext3_xattr_info *i,
struct ext3_xattr_ibody_find *is)
{
struct ext3_xattr_ibody_header *header;
struct ext3_xattr_search *s = &is->s;
int error;
if (EXT3_SB(inode->i_sb)->s_inode_size <= EXT3_GOOD_OLD_INODE_SIZE)
return -ENOSPC;
error = ext3_xattr_set_entry(i, s);
if (error)
return error;
header = IHDR(inode, ext3_raw_inode(&is->iloc));
if (!IS_LAST_ENTRY(s->first)) {
header->h_magic = cpu_to_le32(EXT3_XATTR_MAGIC);
EXT3_I(inode)->i_state |= EXT3_STATE_XATTR;
} else {
header->h_magic = cpu_to_le32(0);
EXT3_I(inode)->i_state &= ~EXT3_STATE_XATTR;
}
return 0;
}
/*
* ext3_xattr_set_handle()
*
* Create, replace or remove an extended attribute for this inode. Buffer
* is NULL to remove an existing extended attribute, and non-NULL to
* either replace an existing extended attribute, or create a new extended
* attribute. The flags XATTR_REPLACE and XATTR_CREATE
* specify that an extended attribute must exist and must not exist
* previous to the call, respectively.
*
* Returns 0, or a negative error number on failure.
*/
int
ext3_xattr_set_handle(handle_t *handle, struct inode *inode, int name_index,
const char *name, const void *value, size_t value_len,
int flags)
{
struct ext3_xattr_info i = {
.name_index = name_index,
.name = name,
.value = value,
.value_len = value_len,
};
struct ext3_xattr_ibody_find is = {
.s = { .not_found = -ENODATA, },
};
struct ext3_xattr_block_find bs = {
.s = { .not_found = -ENODATA, },
};
int error;
if (IS_RDONLY(inode))
return -EROFS;
if (IS_IMMUTABLE(inode) || IS_APPEND(inode))
return -EPERM;
if (!name)
return -EINVAL;
if (strlen(name) > 255)
return -ERANGE;
down_write(&EXT3_I(inode)->xattr_sem);
error = ext3_get_inode_loc(inode, &is.iloc);
if (error)
goto cleanup;
error = ext3_xattr_ibody_find(inode, &i, &is);
if (error)
goto cleanup;
if (is.s.not_found)
error = ext3_xattr_block_find(inode, &i, &bs);
if (error)
goto cleanup;
if (is.s.not_found && bs.s.not_found) {
error = -ENODATA;
if (flags & XATTR_REPLACE)
goto cleanup;
error = 0;
if (!value)
goto cleanup;
} else {
error = -EEXIST;
if (flags & XATTR_CREATE)
goto cleanup;
}
error = ext3_journal_get_write_access(handle, is.iloc.bh);
if (error)
goto cleanup;
if (!value) {
if (!is.s.not_found)
error = ext3_xattr_ibody_set(handle, inode, &i, &is);
else if (!bs.s.not_found)
error = ext3_xattr_block_set(handle, inode, &i, &bs);
} else {
error = ext3_xattr_ibody_set(handle, inode, &i, &is);
if (!error && !bs.s.not_found) {
i.value = NULL;
error = ext3_xattr_block_set(handle, inode, &i, &bs);
} else if (error == -ENOSPC) {
error = ext3_xattr_block_set(handle, inode, &i, &bs);
if (error)
goto cleanup;
if (!is.s.not_found) {
i.value = NULL;
error = ext3_xattr_ibody_set(handle, inode, &i,
&is);
}
}
}
if (!error) {
inode->i_ctime = CURRENT_TIME_SEC;
error = ext3_mark_iloc_dirty(handle, inode, &is.iloc);
/*
* The bh is consumed by ext3_mark_iloc_dirty, even with
* error != 0.
*/
is.iloc.bh = NULL;
if (IS_SYNC(inode))
handle->h_sync = 1;
}
cleanup:
brelse(is.iloc.bh);
brelse(bs.bh);
up_write(&EXT3_I(inode)->xattr_sem);
return error;
}
/* /*
* ext3_xattr_set() * ext3_xattr_set()
* *
......
...@@ -31,6 +31,10 @@ struct ext3_xattr_header { ...@@ -31,6 +31,10 @@ struct ext3_xattr_header {
__u32 h_reserved[4]; /* zero right now */ __u32 h_reserved[4]; /* zero right now */
}; };
struct ext3_xattr_ibody_header {
__le32 h_magic; /* magic number for identification */
};
struct ext3_xattr_entry { struct ext3_xattr_entry {
__u8 e_name_len; /* length of name */ __u8 e_name_len; /* length of name */
__u8 e_name_index; /* attribute name index */ __u8 e_name_index; /* attribute name index */
......
...@@ -195,7 +195,7 @@ struct ext3_group_desc ...@@ -195,7 +195,7 @@ struct ext3_group_desc
*/ */
#define EXT3_STATE_JDATA 0x00000001 /* journaled data exists */ #define EXT3_STATE_JDATA 0x00000001 /* journaled data exists */
#define EXT3_STATE_NEW 0x00000002 /* inode is newly created */ #define EXT3_STATE_NEW 0x00000002 /* inode is newly created */
#define EXT3_STATE_XATTR 0x00000004 /* has in-inode xattrs */
/* Used to pass group descriptor data when online resize is done */ /* Used to pass group descriptor data when online resize is done */
struct ext3_new_group_input { struct ext3_new_group_input {
...@@ -293,6 +293,8 @@ struct ext3_inode { ...@@ -293,6 +293,8 @@ struct ext3_inode {
__u32 m_i_reserved2[2]; __u32 m_i_reserved2[2];
} masix2; } masix2;
} osd2; /* OS dependent 2 */ } osd2; /* OS dependent 2 */
__le16 i_extra_isize;
__le16 i_pad1;
}; };
#define i_size_high i_dir_acl #define i_size_high i_dir_acl
......
...@@ -113,6 +113,9 @@ struct ext3_inode_info { ...@@ -113,6 +113,9 @@ struct ext3_inode_info {
*/ */
loff_t i_disksize; loff_t i_disksize;
/* on-disk additional length */
__u16 i_extra_isize;
/* /*
* truncate_sem is for serialising ext3_truncate() against * truncate_sem is for serialising ext3_truncate() against
* ext3_getblock(). In the 2.4 ext2 design, great chunks of inode's * ext3_getblock(). In the 2.4 ext2 design, great chunks of inode's
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment