bisecting fixing commit since cc4c818b2219c58af5f0ca59f3e9f02c48bc0b65 building syzkaller on cdde748628a830b9236db9890a9fea0764bde4fb testing commit cc4c818b2219c58af5f0ca59f3e9f02c48bc0b65 compiler: gcc version 8.4.1 20210217 (GCC) kernel signature: a1bb834164b2d6b522303c38486ae327d635f78bcc25d23d49bb16afffeb9d40 run #0: crashed: INFO: task hung in do_exit run #1: crashed: INFO: task hung in do_exit run #2: crashed: INFO: task hung in do_exit run #3: crashed: INFO: task hung in do_exit run #4: crashed: INFO: task hung in do_exit run #5: crashed: INFO: task hung in do_exit run #6: crashed: INFO: task hung in do_exit run #7: crashed: INFO: task hung in do_exit run #8: crashed: INFO: task hung in do_exit run #9: crashed: INFO: task hung in do_exit run #10: crashed: INFO: task hung in __do_page_fault run #11: crashed: INFO: task hung in do_exit run #12: crashed: INFO: task hung in do_exit run #13: crashed: INFO: task hung in do_exit run #14: crashed: INFO: task hung in do_exit run #15: crashed: INFO: task hung in do_exit run #16: crashed: INFO: task hung in do_exit run #17: crashed: INFO: task hung in do_exit run #18: crashed: INFO: task hung in do_exit run #19: crashed: INFO: task hung in do_exit testing current HEAD b172b44fcb1771e083aad806fa96f3f60e2ddfac testing commit b172b44fcb1771e083aad806fa96f3f60e2ddfac compiler: gcc version 8.4.1 20210217 (GCC) kernel signature: d5f71a9ee6cba9bfb4ec3bff03200169de771db80172532cb2e4c937abd48948 all runs: crashed: INFO: task hung in do_exit revisions tested: 2, total time: 32m17.45873712s (build: 16m53.584701878s, test: 14m41.34726136s) the crash still happens on HEAD commit msg: Linux 4.19.206 crash: INFO: task hung in do_exit IPv6: ADDRCONF(NETDEV_UP): hsr0: link is not ready IPv6: ADDRCONF(NETDEV_CHANGE): hsr0: link becomes ready IPv6: ADDRCONF(NETDEV_UP): vxcan1: link is not ready 8021q: adding VLAN 0 to HW filter on device batadv0 INFO: task syz-executor.5:6683 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.5 D28168 6683 5661 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x4610d2 Code: Bad RIP value. RSP: 002b:00007ffd2cd647b8 EFLAGS: 00000246 ORIG_RAX: 0000000000000009 RAX: fffffffffffffffc RBX: 0000000000020022 RCX: 00000000004610d2 RDX: 0000000000000000 RSI: 0000000000021000 RDI: 0000000000000000 RBP: 0000000000000000 R08: 00000000ffffffff R09: 0000000000000000 R10: 0000000000020022 R11: 0000000000000246 R12: 00007ffd2cd64980 R13: 0000000000000006 R14: 0000000000000000 R15: 0000000000022000 INFO: task syz-executor.5:6690 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.5 D28200 6690 5661 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x461089 Code: Bad RIP value. RSP: 002b:00007f20d94f5218 EFLAGS: 00000246 ORIG_RAX: 00000000000000ca RAX: fffffffffffffe00 RBX: 000000000052bf08 RCX: 0000000000461089 RDX: 0000000000000000 RSI: 0000000000000080 RDI: 000000000052bf08 RBP: 000000000052bf00 R08: 0000000000000000 R09: 0000000000000000 R10: 0000000000000000 R11: 0000000000000246 R12: 000000000052bf0c R13: 00007ffd2cd6482f R14: 00007f20d94f5300 R15: 0000000000022000 INFO: task syz-executor.2:6684 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.2 D28168 6684 5654 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x4610d2 Code: Bad RIP value. RSP: 002b:00007ffd3c372948 EFLAGS: 00000246 ORIG_RAX: 0000000000000009 RAX: fffffffffffffffc RBX: 0000000000020022 RCX: 00000000004610d2 RDX: 0000000000000000 RSI: 0000000000021000 RDI: 0000000000000000 RBP: 0000000000000000 R08: 00000000ffffffff R09: 0000000000000000 R10: 0000000000020022 R11: 0000000000000246 R12: 00007ffd3c372b10 R13: 0000000000000006 R14: 0000000000000000 R15: 0000000000022000 INFO: task syz-executor.2:6689 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.2 D28200 6689 5654 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x461089 Code: Bad RIP value. RSP: 002b:00007f22f3109218 EFLAGS: 00000246 ORIG_RAX: 00000000000000ca RAX: fffffffffffffe00 RBX: 000000000052bf08 RCX: 0000000000461089 RDX: 0000000000000000 RSI: 0000000000000080 RDI: 000000000052bf08 RBP: 000000000052bf00 R08: 0000000000000000 R09: 0000000000000000 R10: 0000000000000000 R11: 0000000000000246 R12: 000000000052bf0c R13: 00007ffd3c3729bf R14: 00007f22f3109300 R15: 0000000000022000 INFO: task syz-executor.3:6685 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.3 D28168 6685 5656 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x4610d2 Code: Bad RIP value. RSP: 002b:00007fff7329fff8 EFLAGS: 00000246 ORIG_RAX: 0000000000000009 RAX: fffffffffffffffc RBX: 0000000000020022 RCX: 00000000004610d2 RDX: 0000000000000000 RSI: 0000000000021000 RDI: 0000000000000000 RBP: 0000000000000000 R08: 00000000ffffffff R09: 0000000000000000 R10: 0000000000020022 R11: 0000000000000246 R12: 00007fff732a01c0 R13: 0000000000000006 R14: 0000000000000000 R15: 0000000000022000 INFO: task syz-executor.3:6688 blocked for more than 140 seconds. Not tainted 4.19.206-syzkaller #0 "echo 0 > /proc/sys/kernel/hung_task_timeout_secs" disables this message. syz-executor.3 D28200 6688 5656 0x80000004 Call Trace: context_switch kernel/sched/core.c:2828 [inline] __schedule+0xdb5/0x1d40 kernel/sched/core.c:3517 schedule+0x7f/0x1b0 kernel/sched/core.c:3561 __rwsem_down_read_failed_common kernel/locking/rwsem-xadd.c:292 [inline] rwsem_down_read_failed+0x21c/0x3e0 kernel/locking/rwsem-xadd.c:309 call_rwsem_down_read_failed+0x18/0x30 arch/x86/lib/rwsem.S:94 __down_read arch/x86/include/asm/rwsem.h:83 [inline] down_read+0x49/0xb0 kernel/locking/rwsem.c:26 exit_mm kernel/exit.c:512 [inline] do_exit+0x5fc/0x2cf0 kernel/exit.c:857 do_group_exit+0xf4/0x2f0 kernel/exit.c:967 get_signal+0x316/0x19e0 kernel/signal.c:2589 do_signal+0x87/0x1960 arch/x86/kernel/signal.c:799 exit_to_usermode_loop+0x114/0x200 arch/x86/entry/common.c:163 prepare_exit_to_usermode arch/x86/entry/common.c:198 [inline] syscall_return_slowpath arch/x86/entry/common.c:271 [inline] do_syscall_64+0x413/0x4e0 arch/x86/entry/common.c:296 entry_SYSCALL_64_after_hwframe+0x49/0xbe RIP: 0033:0x461089 Code: Bad RIP value. RSP: 002b:00007f9d49723218 EFLAGS: 00000246 ORIG_RAX: 00000000000000ca RAX: fffffffffffffe00 RBX: 000000000052bf08 RCX: 0000000000461089 RDX: 0000000000000000 RSI: 0000000000000080 RDI: 000000000052bf08 RBP: 000000000052bf00 R08: 0000000000000000 R09: 0000000000000000 R10: 0000000000000000 R11: 0000000000000246 R12: 000000000052bf0c R13: 00007fff732a006f R14: 00007f9d49723300 R15: 0000000000022000 Showing all locks held in the system: 1 lock held by khungtaskd/1047: #0: 000000007f57ea1c (rcu_read_lock){....}, at: debug_show_all_locks+0x5b/0x27a kernel/locking/lockdep.c:4443 1 lock held by in:imklog/5345: #0: 00000000221624f2 (&f->f_pos_lock){+.+.}, at: __fdget_pos+0xa7/0xd0 fs/file.c:767 1 lock held by syz-executor.5/6683: #0: 000000000de726cf (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 000000000de726cf (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 1 lock held by syz-executor.5/6690: #0: 000000000de726cf (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 000000000de726cf (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 2 locks held by syz-executor.5/6701: 1 lock held by syz-executor.2/6684: #0: 00000000353f5287 (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 00000000353f5287 (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 1 lock held by syz-executor.2/6689: #0: 00000000353f5287 (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 00000000353f5287 (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 2 locks held by syz-executor.2/6699: 1 lock held by syz-executor.3/6685: #0: 000000003e97b0a8 (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 000000003e97b0a8 (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 1 lock held by syz-executor.3/6688: #0: 000000003e97b0a8 (&mm->mmap_sem){++++}, at: exit_mm kernel/exit.c:512 [inline] #0: 000000003e97b0a8 (&mm->mmap_sem){++++}, at: do_exit+0x5fc/0x2cf0 kernel/exit.c:857 2 locks held by syz-executor.3/6698: ============================================= NMI backtrace for cpu 0 CPU: 0 PID: 1047 Comm: khungtaskd Not tainted 4.19.206-syzkaller #0 Hardware name: Google Google Compute Engine/Google Compute Engine, BIOS Google 01/01/2011 Call Trace: __dump_stack lib/dump_stack.c:77 [inline] dump_stack+0x123/0x171 lib/dump_stack.c:118 nmi_cpu_backtrace.cold.4+0x3e/0x76 lib/nmi_backtrace.c:101 nmi_trigger_cpumask_backtrace+0xe6/0x120 lib/nmi_backtrace.c:62 arch_trigger_cpumask_backtrace+0x14/0x20 arch/x86/kernel/apic/hw_nmi.c:38 trigger_all_cpu_backtrace include/linux/nmi.h:146 [inline] check_hung_uninterruptible_tasks kernel/hung_task.c:203 [inline] watchdog+0x5c3/0xb40 kernel/hung_task.c:287 kthread+0x347/0x410 kernel/kthread.c:259 ret_from_fork+0x24/0x30 arch/x86/entry/entry_64.S:415 Sending NMI from CPU 0 to CPUs 1: NMI backtrace for cpu 1 CPU: 1 PID: 823 Comm: kworker/u4:3 Not tainted 4.19.206-syzkaller #0 Hardware name: Google Google Compute Engine/Google Compute Engine, BIOS Google 01/01/2011 Workqueue: bat_events batadv_nc_worker RIP: 0010:debug_lockdep_rcu_enabled.part.3+0x2a/0x60 kernel/rcu/update.c:254 Code: 48 b8 00 00 00 00 00 fc ff df 55 48 89 e5 53 65 48 8b 1c 25 80 ee 01 00 48 8d bb 84 08 00 00 48 89 fa 48 c1 ea 03 0f b6 14 02 <48> 89 f8 83 e0 07 83 c0 03 38 d0 7c 04 84 d2 75 10 8b 93 84 08 00 RSP: 0018:ffff8881f3f67c30 EFLAGS: 00000803 RAX: dffffc0000000000 RBX: ffff8881f3f4a300 RCX: ffffffff81514b41 RDX: 0000000000000000 RSI: 0000000000000000 RDI: ffff8881f3f4ab84 RBP: ffff8881f3f67c38 R08: 0000000000000000 R09: ffffed103ed2473a R10: ffffed103ed2473a R11: ffff8881f69239d3 R12: ffff8881f3f4a300 R13: 0000000000000263 R14: ffffffff88199ba0 R15: dffffc0000000000 FS: 0000000000000000(0000) GS:ffff8881f6900000(0000) knlGS:0000000000000000 CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033 CR2: 00007f01a6c41000 CR3: 000000000806d002 CR4: 00000000001606e0 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400 Call Trace: debug_lockdep_rcu_enabled+0x77/0x90 kernel/rcu/update.c:253 trace_lock_release include/trace/events/lock.h:58 [inline] lock_release+0x5f2/0x850 kernel/locking/lockdep.c:3926 rcu_lock_release include/linux/rcupdate.h:247 [inline] rcu_read_unlock include/linux/rcupdate.h:681 [inline] batadv_nc_purge_orig_hash net/batman-adv/network-coding.c:423 [inline] batadv_nc_worker+0x191/0x630 net/batman-adv/network-coding.c:730 process_one_work+0x830/0x1670 kernel/workqueue.c:2153 worker_thread+0x85/0xb60 kernel/workqueue.c:2296 kthread+0x347/0x410 kernel/kthread.c:259 ret_from_fork+0x24/0x30 arch/x86/entry/entry_64.S:415 ---------------- Code disassembly (best guess): 0: 48 b8 00 00 00 00 00 movabs $0xdffffc0000000000,%rax 7: fc ff df a: 55 push %rbp b: 48 89 e5 mov %rsp,%rbp e: 53 push %rbx f: 65 48 8b 1c 25 80 ee mov %gs:0x1ee80,%rbx 16: 01 00 18: 48 8d bb 84 08 00 00 lea 0x884(%rbx),%rdi 1f: 48 89 fa mov %rdi,%rdx 22: 48 c1 ea 03 shr $0x3,%rdx 26: 0f b6 14 02 movzbl (%rdx,%rax,1),%edx * 2a: 48 89 f8 mov %rdi,%rax <-- trapping instruction 2d: 83 e0 07 and $0x7,%eax 30: 83 c0 03 add $0x3,%eax 33: 38 d0 cmp %dl,%al 35: 7c 04 jl 0x3b 37: 84 d2 test %dl,%dl 39: 75 10 jne 0x4b 3b: 8b .byte 0x8b 3c: 93 xchg %eax,%ebx 3d: 84 08 test %cl,(%rax)