e293be
centosplus kernel patch [bug#15216]
e293be
e293be
commit 89da619bc18d79bca5304724c11d4ba3b67ce2c6
e293be
Author: Jiang Biao <jiang.biao2@zte.com.cn>
e293be
Date:   Wed Jul 18 10:29:28 2018 +0800
e293be
e293be
    virtio_balloon: fix another race between migration and ballooning
e293be
    
e293be
    Kernel panic when with high memory pressure, calltrace looks like,
e293be
    
e293be
    PID: 21439 TASK: ffff881be3afedd0 CPU: 16 COMMAND: "java"
e293be
     #0 [ffff881ec7ed7630] machine_kexec at ffffffff81059beb
e293be
     #1 [ffff881ec7ed7690] __crash_kexec at ffffffff81105942
e293be
     #2 [ffff881ec7ed7760] crash_kexec at ffffffff81105a30
e293be
     #3 [ffff881ec7ed7778] oops_end at ffffffff816902c8
e293be
     #4 [ffff881ec7ed77a0] no_context at ffffffff8167ff46
e293be
     #5 [ffff881ec7ed77f0] __bad_area_nosemaphore at ffffffff8167ffdc
e293be
     #6 [ffff881ec7ed7838] __node_set at ffffffff81680300
e293be
     #7 [ffff881ec7ed7860] __do_page_fault at ffffffff8169320f
e293be
     #8 [ffff881ec7ed78c0] do_page_fault at ffffffff816932b5
e293be
     #9 [ffff881ec7ed78f0] page_fault at ffffffff8168f4c8
e293be
        [exception RIP: _raw_spin_lock_irqsave+47]
e293be
        RIP: ffffffff8168edef RSP: ffff881ec7ed79a8 RFLAGS: 00010046
e293be
        RAX: 0000000000000246 RBX: ffffea0019740d00 RCX: ffff881ec7ed7fd8
e293be
        RDX: 0000000000020000 RSI: 0000000000000016 RDI: 0000000000000008
e293be
        RBP: ffff881ec7ed79a8 R8: 0000000000000246 R9: 000000000001a098
e293be
        R10: ffff88107ffda000 R11: 0000000000000000 R12: 0000000000000000
e293be
        R13: 0000000000000008 R14: ffff881ec7ed7a80 R15: ffff881be3afedd0
e293be
        ORIG_RAX: ffffffffffffffff CS: 0010 SS: 0018
e293be
    
e293be
    It happens in the pagefault and results in double pagefault
e293be
    during compacting pages when memory allocation fails.
e293be
    
e293be
    Analysed the vmcore, the page leads to second pagefault is corrupted
e293be
    with _mapcount=-256, but private=0.
e293be
    
e293be
    It's caused by the race between migration and ballooning, and lock
e293be
    missing in virtballoon_migratepage() of virtio_balloon driver.
e293be
    This patch fix the bug.
e293be
    
e293be
    Fixes: e22504296d4f64f ("virtio_balloon: introduce migration primitives to balloon pages")
e293be
    Cc: stable@vger.kernel.org
e293be
    Signed-off-by: Jiang Biao <jiang.biao2@zte.com.cn>
e293be
    Signed-off-by: Huang Chong <huang.chong@zte.com.cn>
e293be
    Signed-off-by: Michael S. Tsirkin <mst@redhat.com>
e293be
e293be
    Applied-by: Akemi Yagi <toracat@centos.org>
e293be
e293be
diff --git a/drivers/virtio/virtio_balloon.c b/drivers/virtio/virtio_balloon.c
e293be
index 6b237e3..3988c09 100644
e293be
--- a/drivers/virtio/virtio_balloon.c
e293be
+++ b/drivers/virtio/virtio_balloon.c
e293be
@@ -513,7 +513,9 @@ static int virtballoon_migratepage(struct balloon_dev_info *vb_dev_info,
e293be
 	tell_host(vb, vb->inflate_vq);
e293be
 
e293be
 	/* balloon's page migration 2nd step -- deflate "page" */
e293be
+	spin_lock_irqsave(&vb_dev_info->pages_lock, flags);
e293be
 	balloon_page_delete(page);
e293be
+	spin_unlock_irqrestore(&vb_dev_info->pages_lock, flags);
e293be
 	vb->num_pfns = VIRTIO_BALLOON_PAGES_PER_PAGE;
e293be
 	set_page_pfns(vb, vb->pfns, page);
e293be
 	tell_host(vb, vb->deflate_vq);