Commit 2e8fa54e authored by Jan Kara, committed by Theodore Ts'o

ext4: split extent conversion lists to reserved & unreserved parts

Now that we have extent conversions with a reserved transaction, we have
to prevent extent conversions without a reserved transaction (from the DIO
code) from blocking them, as that would effectively void any transaction
reservation we made.  So split the lists, work items, and work queues into
reserved and unreserved parts.

Reviewed-by: Zheng Liu <wenqing.lz@taobao.com>
Signed-off-by: Jan Kara <jack@suse.cz>
Signed-off-by: "Theodore Ts'o" <tytso@mit.edu>
parent 6b523df4
...@@ -887,12 +887,22 @@ struct ext4_inode_info { ...@@ -887,12 +887,22 @@ struct ext4_inode_info {
qsize_t i_reserved_quota; qsize_t i_reserved_quota;
#endif #endif
/* completed IOs that might need unwritten extents handling */ /* Lock protecting lists below */
struct list_head i_completed_io_list;
spinlock_t i_completed_io_lock; spinlock_t i_completed_io_lock;
/*
* Completed IOs that need unwritten extents handling and have
* transaction reserved
*/
struct list_head i_rsv_conversion_list;
/*
* Completed IOs that need unwritten extents handling and don't have
* transaction reserved
*/
struct list_head i_unrsv_conversion_list;
atomic_t i_ioend_count; /* Number of outstanding io_end structs */ atomic_t i_ioend_count; /* Number of outstanding io_end structs */
atomic_t i_unwritten; /* Nr. of inflight conversions pending */ atomic_t i_unwritten; /* Nr. of inflight conversions pending */
struct work_struct i_unwritten_work; /* deferred extent conversion */ struct work_struct i_rsv_conversion_work;
struct work_struct i_unrsv_conversion_work;
spinlock_t i_block_reservation_lock; spinlock_t i_block_reservation_lock;
...@@ -1264,8 +1274,10 @@ struct ext4_sb_info { ...@@ -1264,8 +1274,10 @@ struct ext4_sb_info {
struct flex_groups *s_flex_groups; struct flex_groups *s_flex_groups;
ext4_group_t s_flex_groups_allocated; ext4_group_t s_flex_groups_allocated;
/* workqueue for dio unwritten */ /* workqueue for unreserved extent conversions (dio) */
struct workqueue_struct *dio_unwritten_wq; struct workqueue_struct *unrsv_conversion_wq;
/* workqueue for reserved extent conversions (buffered io) */
struct workqueue_struct *rsv_conversion_wq;
/* timer for periodic error stats printing */ /* timer for periodic error stats printing */
struct timer_list s_err_report; struct timer_list s_err_report;
...@@ -2646,7 +2658,8 @@ extern int ext4_put_io_end(ext4_io_end_t *io_end); ...@@ -2646,7 +2658,8 @@ extern int ext4_put_io_end(ext4_io_end_t *io_end);
extern void ext4_put_io_end_defer(ext4_io_end_t *io_end); extern void ext4_put_io_end_defer(ext4_io_end_t *io_end);
extern void ext4_io_submit_init(struct ext4_io_submit *io, extern void ext4_io_submit_init(struct ext4_io_submit *io,
struct writeback_control *wbc); struct writeback_control *wbc);
extern void ext4_end_io_work(struct work_struct *work); extern void ext4_end_io_rsv_work(struct work_struct *work);
extern void ext4_end_io_unrsv_work(struct work_struct *work);
extern void ext4_io_submit(struct ext4_io_submit *io); extern void ext4_io_submit(struct ext4_io_submit *io);
extern int ext4_bio_write_page(struct ext4_io_submit *io, extern int ext4_bio_write_page(struct ext4_io_submit *io,
struct page *page, struct page *page,
......
...@@ -58,8 +58,10 @@ void ext4_ioend_shutdown(struct inode *inode) ...@@ -58,8 +58,10 @@ void ext4_ioend_shutdown(struct inode *inode)
* We need to make sure the work structure is finished being * We need to make sure the work structure is finished being
* used before we let the inode get destroyed. * used before we let the inode get destroyed.
*/ */
if (work_pending(&EXT4_I(inode)->i_unwritten_work)) if (work_pending(&EXT4_I(inode)->i_rsv_conversion_work))
cancel_work_sync(&EXT4_I(inode)->i_unwritten_work); cancel_work_sync(&EXT4_I(inode)->i_rsv_conversion_work);
if (work_pending(&EXT4_I(inode)->i_unrsv_conversion_work))
cancel_work_sync(&EXT4_I(inode)->i_unrsv_conversion_work);
} }
static void ext4_release_io_end(ext4_io_end_t *io_end) static void ext4_release_io_end(ext4_io_end_t *io_end)
...@@ -114,20 +116,17 @@ static int ext4_end_io(ext4_io_end_t *io) ...@@ -114,20 +116,17 @@ static int ext4_end_io(ext4_io_end_t *io)
return ret; return ret;
} }
static void dump_completed_IO(struct inode *inode) static void dump_completed_IO(struct inode *inode, struct list_head *head)
{ {
#ifdef EXT4FS_DEBUG #ifdef EXT4FS_DEBUG
struct list_head *cur, *before, *after; struct list_head *cur, *before, *after;
ext4_io_end_t *io, *io0, *io1; ext4_io_end_t *io, *io0, *io1;
if (list_empty(&EXT4_I(inode)->i_completed_io_list)) { if (list_empty(head))
ext4_debug("inode %lu completed_io list is empty\n",
inode->i_ino);
return; return;
}
ext4_debug("Dump inode %lu completed_io list\n", inode->i_ino); ext4_debug("Dump inode %lu completed io list\n", inode->i_ino);
list_for_each_entry(io, &EXT4_I(inode)->i_completed_io_list, list) { list_for_each_entry(io, head, list) {
cur = &io->list; cur = &io->list;
before = cur->prev; before = cur->prev;
io0 = container_of(before, ext4_io_end_t, list); io0 = container_of(before, ext4_io_end_t, list);
...@@ -148,16 +147,23 @@ static void ext4_add_complete_io(ext4_io_end_t *io_end) ...@@ -148,16 +147,23 @@ static void ext4_add_complete_io(ext4_io_end_t *io_end)
unsigned long flags; unsigned long flags;
BUG_ON(!(io_end->flag & EXT4_IO_END_UNWRITTEN)); BUG_ON(!(io_end->flag & EXT4_IO_END_UNWRITTEN));
wq = EXT4_SB(io_end->inode->i_sb)->dio_unwritten_wq;
spin_lock_irqsave(&ei->i_completed_io_lock, flags); spin_lock_irqsave(&ei->i_completed_io_lock, flags);
if (list_empty(&ei->i_completed_io_list)) if (io_end->handle) {
queue_work(wq, &ei->i_unwritten_work); wq = EXT4_SB(io_end->inode->i_sb)->rsv_conversion_wq;
list_add_tail(&io_end->list, &ei->i_completed_io_list); if (list_empty(&ei->i_rsv_conversion_list))
queue_work(wq, &ei->i_rsv_conversion_work);
list_add_tail(&io_end->list, &ei->i_rsv_conversion_list);
} else {
wq = EXT4_SB(io_end->inode->i_sb)->unrsv_conversion_wq;
if (list_empty(&ei->i_unrsv_conversion_list))
queue_work(wq, &ei->i_unrsv_conversion_work);
list_add_tail(&io_end->list, &ei->i_unrsv_conversion_list);
}
spin_unlock_irqrestore(&ei->i_completed_io_lock, flags); spin_unlock_irqrestore(&ei->i_completed_io_lock, flags);
} }
static int ext4_do_flush_completed_IO(struct inode *inode) static int ext4_do_flush_completed_IO(struct inode *inode,
struct list_head *head)
{ {
ext4_io_end_t *io; ext4_io_end_t *io;
struct list_head unwritten; struct list_head unwritten;
...@@ -166,8 +172,8 @@ static int ext4_do_flush_completed_IO(struct inode *inode) ...@@ -166,8 +172,8 @@ static int ext4_do_flush_completed_IO(struct inode *inode)
int err, ret = 0; int err, ret = 0;
spin_lock_irqsave(&ei->i_completed_io_lock, flags); spin_lock_irqsave(&ei->i_completed_io_lock, flags);
dump_completed_IO(inode); dump_completed_IO(inode, head);
list_replace_init(&ei->i_completed_io_list, &unwritten); list_replace_init(head, &unwritten);
spin_unlock_irqrestore(&ei->i_completed_io_lock, flags); spin_unlock_irqrestore(&ei->i_completed_io_lock, flags);
while (!list_empty(&unwritten)) { while (!list_empty(&unwritten)) {
...@@ -183,21 +189,34 @@ static int ext4_do_flush_completed_IO(struct inode *inode) ...@@ -183,21 +189,34 @@ static int ext4_do_flush_completed_IO(struct inode *inode)
} }
/* /*
* work on completed aio dio IO, to convert unwritten extents to extents * work on completed IO, to convert unwritten extents to extents
*/ */
void ext4_end_io_work(struct work_struct *work) void ext4_end_io_rsv_work(struct work_struct *work)
{ {
struct ext4_inode_info *ei = container_of(work, struct ext4_inode_info, struct ext4_inode_info *ei = container_of(work, struct ext4_inode_info,
i_unwritten_work); i_rsv_conversion_work);
ext4_do_flush_completed_IO(&ei->vfs_inode); ext4_do_flush_completed_IO(&ei->vfs_inode, &ei->i_rsv_conversion_list);
}
void ext4_end_io_unrsv_work(struct work_struct *work)
{
struct ext4_inode_info *ei = container_of(work, struct ext4_inode_info,
i_unrsv_conversion_work);
ext4_do_flush_completed_IO(&ei->vfs_inode, &ei->i_unrsv_conversion_list);
} }
int ext4_flush_unwritten_io(struct inode *inode) int ext4_flush_unwritten_io(struct inode *inode)
{ {
int ret; int ret, err;
WARN_ON_ONCE(!mutex_is_locked(&inode->i_mutex) && WARN_ON_ONCE(!mutex_is_locked(&inode->i_mutex) &&
!(inode->i_state & I_FREEING)); !(inode->i_state & I_FREEING));
ret = ext4_do_flush_completed_IO(inode); ret = ext4_do_flush_completed_IO(inode,
&EXT4_I(inode)->i_rsv_conversion_list);
err = ext4_do_flush_completed_IO(inode,
&EXT4_I(inode)->i_unrsv_conversion_list);
if (!ret)
ret = err;
ext4_unwritten_wait(inode); ext4_unwritten_wait(inode);
return ret; return ret;
} }
......
...@@ -750,8 +750,10 @@ static void ext4_put_super(struct super_block *sb) ...@@ -750,8 +750,10 @@ static void ext4_put_super(struct super_block *sb)
ext4_unregister_li_request(sb); ext4_unregister_li_request(sb);
dquot_disable(sb, -1, DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED); dquot_disable(sb, -1, DQUOT_USAGE_ENABLED | DQUOT_LIMITS_ENABLED);
flush_workqueue(sbi->dio_unwritten_wq); flush_workqueue(sbi->unrsv_conversion_wq);
destroy_workqueue(sbi->dio_unwritten_wq); flush_workqueue(sbi->rsv_conversion_wq);
destroy_workqueue(sbi->unrsv_conversion_wq);
destroy_workqueue(sbi->rsv_conversion_wq);
if (sbi->s_journal) { if (sbi->s_journal) {
err = jbd2_journal_destroy(sbi->s_journal); err = jbd2_journal_destroy(sbi->s_journal);
...@@ -859,13 +861,15 @@ static struct inode *ext4_alloc_inode(struct super_block *sb) ...@@ -859,13 +861,15 @@ static struct inode *ext4_alloc_inode(struct super_block *sb)
ei->i_reserved_quota = 0; ei->i_reserved_quota = 0;
#endif #endif
ei->jinode = NULL; ei->jinode = NULL;
INIT_LIST_HEAD(&ei->i_completed_io_list); INIT_LIST_HEAD(&ei->i_rsv_conversion_list);
INIT_LIST_HEAD(&ei->i_unrsv_conversion_list);
spin_lock_init(&ei->i_completed_io_lock); spin_lock_init(&ei->i_completed_io_lock);
ei->i_sync_tid = 0; ei->i_sync_tid = 0;
ei->i_datasync_tid = 0; ei->i_datasync_tid = 0;
atomic_set(&ei->i_ioend_count, 0); atomic_set(&ei->i_ioend_count, 0);
atomic_set(&ei->i_unwritten, 0); atomic_set(&ei->i_unwritten, 0);
INIT_WORK(&ei->i_unwritten_work, ext4_end_io_work); INIT_WORK(&ei->i_rsv_conversion_work, ext4_end_io_rsv_work);
INIT_WORK(&ei->i_unrsv_conversion_work, ext4_end_io_unrsv_work);
return &ei->vfs_inode; return &ei->vfs_inode;
} }
...@@ -3936,12 +3940,20 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) ...@@ -3936,12 +3940,20 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent)
* The maximum number of concurrent works can be high and * The maximum number of concurrent works can be high and
* concurrency isn't really necessary. Limit it to 1. * concurrency isn't really necessary. Limit it to 1.
*/ */
EXT4_SB(sb)->dio_unwritten_wq = EXT4_SB(sb)->rsv_conversion_wq =
alloc_workqueue("ext4-dio-unwritten", WQ_MEM_RECLAIM | WQ_UNBOUND, 1); alloc_workqueue("ext4-rsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1);
if (!EXT4_SB(sb)->dio_unwritten_wq) { if (!EXT4_SB(sb)->rsv_conversion_wq) {
printk(KERN_ERR "EXT4-fs: failed to create DIO workqueue\n"); printk(KERN_ERR "EXT4-fs: failed to create workqueue\n");
ret = -ENOMEM; ret = -ENOMEM;
goto failed_mount_wq; goto failed_mount4;
}
EXT4_SB(sb)->unrsv_conversion_wq =
alloc_workqueue("ext4-unrsv-conversion", WQ_MEM_RECLAIM | WQ_UNBOUND, 1);
if (!EXT4_SB(sb)->unrsv_conversion_wq) {
printk(KERN_ERR "EXT4-fs: failed to create workqueue\n");
ret = -ENOMEM;
goto failed_mount4;
} }
/* /*
...@@ -4095,7 +4107,10 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent) ...@@ -4095,7 +4107,10 @@ static int ext4_fill_super(struct super_block *sb, void *data, int silent)
sb->s_root = NULL; sb->s_root = NULL;
failed_mount4: failed_mount4:
ext4_msg(sb, KERN_ERR, "mount failed"); ext4_msg(sb, KERN_ERR, "mount failed");
destroy_workqueue(EXT4_SB(sb)->dio_unwritten_wq); if (EXT4_SB(sb)->rsv_conversion_wq)
destroy_workqueue(EXT4_SB(sb)->rsv_conversion_wq);
if (EXT4_SB(sb)->unrsv_conversion_wq)
destroy_workqueue(EXT4_SB(sb)->unrsv_conversion_wq);
failed_mount_wq: failed_mount_wq:
if (sbi->s_journal) { if (sbi->s_journal) {
jbd2_journal_destroy(sbi->s_journal); jbd2_journal_destroy(sbi->s_journal);
...@@ -4541,7 +4556,8 @@ static int ext4_sync_fs(struct super_block *sb, int wait) ...@@ -4541,7 +4556,8 @@ static int ext4_sync_fs(struct super_block *sb, int wait)
struct ext4_sb_info *sbi = EXT4_SB(sb); struct ext4_sb_info *sbi = EXT4_SB(sb);
trace_ext4_sync_fs(sb, wait); trace_ext4_sync_fs(sb, wait);
flush_workqueue(sbi->dio_unwritten_wq); flush_workqueue(sbi->rsv_conversion_wq);
flush_workqueue(sbi->unrsv_conversion_wq);
/* /*
* Writeback quota in non-journalled quota case - journalled quota has * Writeback quota in non-journalled quota case - journalled quota has
* no dirty dquots * no dirty dquots
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment