[PATCH] jffs2: GC deadlock reading a page that is used in jffs2_write_begin()
Kyeong Yoo
Kyeong.Yoo at alliedtelesis.co.nz
Mon Jul 17 14:54:55 PDT 2017
Hi,
Can someone review this and give me any feedback?
This patch is to prevent deadlock in jffs2 GC.
Thanks,
Kyeong
On 04/07/17 16:22, Kyeong Yoo wrote:
> GC task can deadlock in read_cache_page() because it may attempt
> to release a page that is actually allocated by another task in
> jffs2_write_begin().
> The reason is that in jffs2_write_begin() there is a small window
> a cache page is allocated for use but not set Uptodate yet.
>
> This ends up with a deadlock between two tasks:
> 1) A task (e.g. file copy)
> - jffs2_write_begin() locks a cache page
> - jffs2_write_end() tries to lock "alloc_sem" from
> jffs2_reserve_space() <-- STUCK
> 2) GC task (jffs2_gcd_mtd3)
> - jffs2_garbage_collect_pass() locks "alloc_sem"
> - try to lock the same cache page in read_cache_page() <-- STUCK
>
> So to avoid this deadlock, hold "alloc_sem" in jffs2_write_begin()
> while reading data in a cache page.
>
> Signed-off-by: Kyeong Yoo <kyeong.yoo at alliedtelesis.co.nz>
> ---
>
> Note: I'm resending this patch to linux-mtd.
>
> fs/jffs2/file.c | 40 +++++++++++++++++++++++++---------------
> 1 file changed, 25 insertions(+), 15 deletions(-)
>
> diff --git a/fs/jffs2/file.c b/fs/jffs2/file.c
> index c12476e309c6..eb4e4d784d26 100644
> --- a/fs/jffs2/file.c
> +++ b/fs/jffs2/file.c
> @@ -135,20 +135,15 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> struct page *pg;
> struct inode *inode = mapping->host;
> struct jffs2_inode_info *f = JFFS2_INODE_INFO(inode);
> + struct jffs2_sb_info *c = JFFS2_SB_INFO(inode->i_sb);
> pgoff_t index = pos >> PAGE_SHIFT;
> uint32_t pageofs = index << PAGE_SHIFT;
> int ret = 0;
>
> - pg = grab_cache_page_write_begin(mapping, index, flags);
> - if (!pg)
> - return -ENOMEM;
> - *pagep = pg;
> -
> jffs2_dbg(1, "%s()\n", __func__);
>
> if (pageofs > inode->i_size) {
> /* Make new hole frag from old EOF to new page */
> - struct jffs2_sb_info *c = JFFS2_SB_INFO(inode->i_sb);
> struct jffs2_raw_inode ri;
> struct jffs2_full_dnode *fn;
> uint32_t alloc_len;
> @@ -159,7 +154,7 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> ret = jffs2_reserve_space(c, sizeof(ri), &alloc_len,
> ALLOC_NORMAL, JFFS2_SUMMARY_INODE_SIZE);
> if (ret)
> - goto out_page;
> + goto out_err;
>
> mutex_lock(&f->sem);
> memset(&ri, 0, sizeof(ri));
> @@ -189,7 +184,7 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> ret = PTR_ERR(fn);
> jffs2_complete_reservation(c);
> mutex_unlock(&f->sem);
> - goto out_page;
> + goto out_err;
> }
> ret = jffs2_add_full_dnode_to_inode(c, f, fn);
> if (f->metadata) {
> @@ -204,7 +199,7 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> jffs2_free_full_dnode(fn);
> jffs2_complete_reservation(c);
> mutex_unlock(&f->sem);
> - goto out_page;
> + goto out_err;
> }
> jffs2_complete_reservation(c);
> inode->i_size = pageofs;
> @@ -212,6 +207,19 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> }
>
> /*
> + * While getting a page and reading data in, lock c->alloc_sem until
> + * the page is Uptodate. Otherwise GC task may attempt to read the same
> + * page in read_cache_page(), which causes a deadlock.
> + */
> + mutex_lock(&c->alloc_sem);
> + pg = grab_cache_page_write_begin(mapping, index, flags);
> + if (!pg) {
> + ret = -ENOMEM;
> + goto release_sem;
> + }
> + *pagep = pg;
> +
> + /*
> * Read in the page if it wasn't already present. Cannot optimize away
> * the whole page write case until jffs2_write_end can handle the
> * case of a short-copy.
> @@ -220,15 +228,17 @@ static int jffs2_write_begin(struct file *filp, struct address_space *mapping,
> mutex_lock(&f->sem);
> ret = jffs2_do_readpage_nolock(inode, pg);
> mutex_unlock(&f->sem);
> - if (ret)
> - goto out_page;
> + if (ret) {
> + unlock_page(pg);
> + put_page(pg);
> + goto release_sem;
> + }
> }
> jffs2_dbg(1, "end write_begin(). pg->flags %lx\n", pg->flags);
> - return ret;
>
> -out_page:
> - unlock_page(pg);
> - put_page(pg);
> +release_sem:
> + mutex_unlock(&c->alloc_sem);
> +out_err:
> return ret;
> }
>
>
More information about the linux-mtd
mailing list