Hey,
Until yesterday, everything was working fine, but since today I have been getting weird syslog messages like this:
All virtual machines are hanging, nothing is working. I cannot stop them. I cannot start other machines.
I have to reset my server.
After rebooting, everything seems to be fine for a few minutes, but then it crashes again.
What do you need to help out?
regards
Until yesterday, everything was working fine, but since today I have been getting weird syslog messages like this:
Code:
INFO: task kdmflush:965 blocked for more than 120 seconds.
"echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
kdmflush D ffff88032ea7bb80 0 965 2 0x00000000
ffff880331a35a50 0000000000000046 0000000300000000 ffff880331a35fd8
0000000000015800 ffff880331a35fd8 ffff8803307344d0 0000000000015800
0000000000015800 0000000000015800 0000000000015800 ffff8803307344d0
Call Trace:
[<ffffffffa00551d3>] wait_barrier+0xb0/0xf5 [raid1]
[<ffffffff8104d827>] ? default_wake_function+0x0/0x14
[<ffffffffa0057639>] make_request+0x17e/0x869 [raid1]
[<ffffffff8103dc47>] ? check_preempt_curr_idle+0x15/0x17
[<ffffffff8104d815>] ? try_to_wake_up+0x2a9/0x2bb
[<ffffffff81042894>] ? update_curr+0xde/0x192
[<ffffffff813a6893>] md_make_request+0xdf/0x1e6
[<ffffffff810d7f47>] ? mempool_alloc_slab+0x16/0x18
[<ffffffff812296fe>] generic_make_request+0x2a4/0x329
[<ffffffff81140ea1>] ? bio_alloc_bioset+0x4d/0xc5
[<ffffffff813b13e4>] __map_bio+0xa0/0xfe
[<ffffffff813b249e>] __split_and_process_bio+0x2a9/0x591
[<ffffffff8106c397>] ? remove_wait_queue+0x4d/0x52
[<ffffffff813b1bc1>] ? dm_wait_for_completion+0xe1/0xf2
[<ffffffff813b28d3>] dm_wq_work+0xef/0x18a
[<ffffffff810683ab>] worker_thread+0x1a9/0x24d
[<ffffffff814b4aad>] ? schedule+0x58f/0x5f4
[<ffffffff813b27e4>] ? dm_wq_work+0x0/0x18a
[<ffffffff8106c0e8>] ? autoremove_wake_function+0x0/0x3d
[<ffffffff81068202>] ? worker_thread+0x0/0x24d
[<ffffffff8106bc00>] kthread+0x82/0x8a
[<ffffffff8100ab24>] kernel_thread_helper+0x4/0x10
[<ffffffff8106bb7e>] ? kthread+0x0/0x8a
[<ffffffff8100ab20>] ? kernel_thread_helper+0x0/0x10
INFO: task kcopyd:970 blocked for more than 120 seconds.
"echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
kcopyd D ffff880330e383b0 0 970 2 0x00000000
ffff88032fcf3b00 0000000000000046 0000000000000000 ffff88032fcf3fd8
0000000000015800 ffff88032fcf3fd8 ffff880330e38000 0000000000015800
0000000000015800 0000000000015800 0000000000015800 ffff880330e38000
Call Trace:
[<ffffffff813b7216>] ? vm_get_page+0x0/0x47
[<ffffffff814b4b92>] io_schedule+0x80/0xc6
[<ffffffff813b773a>] dm_io+0x1b3/0x2e1
[<ffffffff813b7216>] ? vm_get_page+0x0/0x47
[<ffffffff813b71b2>] ? vm_next_page+0x0/0x21
[<ffffffff810dace3>] ? free_one_page+0x6d/0x7b
[<ffffffff813be169>] chunk_io+0x88/0xf5
[<ffffffff813be169>] ? chunk_io+0x88/0xf5
[<ffffffff810dbda7>] ? __free_pages+0x24/0x26
[<ffffffff8110af80>] ? __free_slab+0x118/0x125
[<ffffffff813bbcf2>] ? copy_callback+0x0/0x41
[<ffffffff813be288>] area_io+0x26/0x28
[<ffffffff813be492>] persistent_commit_exception+0xbd/0x11f
[<ffffffff810d7f2f>] ? mempool_free_slab+0x17/0x19
[<ffffffff813bbd31>] copy_callback+0x3f/0x41
[<ffffffff813b81cd>] run_complete_job+0x92/0xc3
[<ffffffff813b7efa>] process_jobs+0x2f/0xfa
[<ffffffff813b813b>] ? run_complete_job+0x0/0xc3
[<ffffffff813b7feb>] do_work+0x26/0x54
[<ffffffff810683ab>] worker_thread+0x1a9/0x24d
[<ffffffff814b4aad>] ? schedule+0x58f/0x5f4
[<ffffffff813b7fc5>] ? do_work+0x0/0x54
[<ffffffff8106c0e8>] ? autoremove_wake_function+0x0/0x3d
[<ffffffff81068202>] ? worker_thread+0x0/0x24d
[<ffffffff8106bc00>] kthread+0x82/0x8a
[<ffffffff8100ab24>] kernel_thread_helper+0x4/0x10
[<ffffffff8106bb7e>] ? kthread+0x0/0x8a
[<ffffffff8100ab20>] ? kernel_thread_helper+0x0/0x10
INFO: task kvm:1976 blocked for more than 120 seconds.
"echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
kvm D ffff880330b6df70 0 1976 1 0x00000000
ffff880235f778f8 0000000000000086 0000000300000000 ffff880235f77fd8
0000000000015800 ffff880235f77fd8 ffff880330b6dbc0 0000000000015800
0000000000015800 0000000000015800 0000000000015800 ffff880330b6dbc0
Call Trace:
[<ffffffffa00551d3>] wait_barrier+0xb0/0xf5 [raid1]
[<ffffffff8104d827>] ? default_wake_function+0x0/0x14
[<ffffffffa0057639>] make_request+0x17e/0x869 [raid1]
[<ffffffff813b13e4>] ? __map_bio+0xa0/0xfe
[<ffffffff813a6893>] md_make_request+0xdf/0x1e6
[<ffffffff812296fe>] generic_make_request+0x2a4/0x329
[<ffffffff81229862>] submit_bio+0xdf/0xfc
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8114330f>] dio_bio_submit+0x84/0xa9
[<ffffffff81143e89>] __blockdev_direct_IO_newtrunc+0x810/0x9ad
[<ffffffff8114217c>] blkdev_direct_IO+0x57/0x59
[<ffffffff811410e8>] ? blkdev_get_blocks+0x0/0x8f
[<ffffffff810d77cf>] generic_file_aio_read+0xe4/0x5dd
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8111a5b3>] do_sync_read+0xcc/0x112
[<ffffffff810637e1>] ? kill_pid_info+0x3f/0x4c
[<ffffffff811f9e75>] ? security_file_permission+0x16/0x18
[<ffffffff8111b070>] vfs_read+0xad/0x107
[<ffffffff8111b12b>] sys_pread64+0x61/0x82
[<ffffffff81009d32>] system_call_fastpath+0x16/0x1b
INFO: task kvm:1977 blocked for more than 120 seconds.
"echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
kvm D ffff8803294e4880 0 1977 1 0x00000000
ffff880235e978f8 0000000000000086 0000000300000000 ffff880235e97fd8
0000000000015800 ffff880235e97fd8 ffff8803294e44d0 0000000000015800
0000000000015800 0000000000015800 0000000000015800 ffff8803294e44d0
Call Trace:
[<ffffffffa00551d3>] wait_barrier+0xb0/0xf5 [raid1]
[<ffffffff8104d827>] ? default_wake_function+0x0/0x14
[<ffffffffa0057639>] make_request+0x17e/0x869 [raid1]
[<ffffffff813b13e4>] ? __map_bio+0xa0/0xfe
[<ffffffff81042894>] ? update_curr+0xde/0x192
[<ffffffff813a6893>] md_make_request+0xdf/0x1e6
[<ffffffff812296fe>] generic_make_request+0x2a4/0x329
[<ffffffff81229862>] submit_bio+0xdf/0xfc
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8114330f>] dio_bio_submit+0x84/0xa9
[<ffffffff81143e89>] __blockdev_direct_IO_newtrunc+0x810/0x9ad
[<ffffffff8114217c>] blkdev_direct_IO+0x57/0x59
[<ffffffff811410e8>] ? blkdev_get_blocks+0x0/0x8f
[<ffffffff810d77cf>] generic_file_aio_read+0xe4/0x5dd
[<ffffffff814b66ce>] ? common_interrupt+0xe/0x13
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8111a5b3>] do_sync_read+0xcc/0x112
[<ffffffff8106379a>] ? group_send_sig_info+0x39/0x41
[<ffffffff810637e1>] ? kill_pid_info+0x3f/0x4c
[<ffffffff811f9e75>] ? security_file_permission+0x16/0x18
[<ffffffff8111b070>] vfs_read+0xad/0x107
[<ffffffff8111b12b>] sys_pread64+0x61/0x82
[<ffffffff81009d32>] system_call_fastpath+0x16/0x1b
INFO: task kvm:1978 blocked for more than 120 seconds.
"echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message.
kvm D ffff8803296ac880 0 1978 1 0x00000000
ffff880235e858f8 0000000000000086 0000000300000000 ffff880235e85fd8
0000000000015800 ffff880235e85fd8 ffff8803296ac4d0 0000000000015800
0000000000015800 0000000000015800 0000000000015800 ffff8803296ac4d0
Call Trace:
[<ffffffffa00551d3>] wait_barrier+0xb0/0xf5 [raid1]
[<ffffffff8104d827>] ? default_wake_function+0x0/0x14
[<ffffffffa0057639>] make_request+0x17e/0x869 [raid1]
[<ffffffff813b13e4>] ? __map_bio+0xa0/0xfe
[<ffffffff814b624a>] ? _raw_spin_lock_irq+0x15/0x19
[<ffffffff813a6893>] md_make_request+0xdf/0x1e6
[<ffffffff812296fe>] generic_make_request+0x2a4/0x329
[<ffffffff81229862>] submit_bio+0xdf/0xfc
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8114330f>] dio_bio_submit+0x84/0xa9
[<ffffffff81143e89>] __blockdev_direct_IO_newtrunc+0x810/0x9ad
[<ffffffff8114217c>] blkdev_direct_IO+0x57/0x59
[<ffffffff811410e8>] ? blkdev_get_blocks+0x0/0x8f
[<ffffffff810d77cf>] generic_file_aio_read+0xe4/0x5dd
[<ffffffff8102f0e7>] ? default_spin_lock_flags+0x9/0xe
[<ffffffff8111a5b3>] do_sync_read+0xcc/0x112
[<ffffffff810637e1>] ? kill_pid_info+0x3f/0x4c
[<ffffffff811f9e75>] ? security_file_permission+0x16/0x18
[<ffffffff8111b070>] vfs_read+0xad/0x107
[<ffffffff8111b12b>] sys_pread64+0x61/0x82
[<ffffffff81009d32>] system_call_fastpath+0x16/0x1b
All virtual machines are hanging, nothing is working. I cannot stop them. I cannot start other machines.
I have to reset my server.
After rebooting, everything seems to be fine for a few minutes, but then it crashes again.
What information do you need from me to help diagnose this?
regards