<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:38:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10852] racer test 1 hangs in locking</title>
                <link>https://jira.whamcloud.com/browse/LU-10852</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;racer test_1 hangs. Looking at the logs at &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/49a29a5e-2f2f-11e8-9e0e-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/49a29a5e-2f2f-11e8-9e0e-52540065bddc&lt;/a&gt;, the last lines in the suite_log are&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Waited 950, rc=3 USER&#160;&#160;&#160;&#160;&#160;&#160; PID %CPU %MEM&#160;&#160;&#160; VSZ&#160;&#160; RSS TTY&#160;&#160;&#160;&#160;&#160; STAT START&#160;&#160; TIME COMMAND
./file_exec.sh: fork: retry: No child processes
./file_exec.sh: fork: retry: No child processes
./file_exec.sh: fork: retry: No child processes
./file_exec.sh: fork: retry: No child processes
./file_exec.sh: fork: retry: No child processes
./file_exec.sh: fork: retry: No child processes
./&#160;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;In the console logs for the MDS with MDT1 and MDT3, we see&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[37477.133999] Lustre: DEBUG MARKER: == racer test 1: racer on clients: trevis-8vm1,trevis-8vm2 DURATION=900 ============================== 22:31:21 (1521783081)
[37538.184449] Lustre: lustre-MDT0001: Client ea0330a2-74e9-672c-10d5-7c42a043d466 (at 10.9.4.82@tcp) reconnecting
[37538.184457] Lustre: Skipped 1 previous similar message
[37538.184519] Lustre: lustre-MDT0001: Connection restored to db24b367-e4c2-8934-3f7e-5f07540bffb1 (at 10.9.4.82@tcp)
[37538.184520] Lustre: Skipped 48 previous similar messages
[37568.843505] Lustre: lustre-MDT0003: Client 6439aead-19f9-dcaa-af11-fb13e38eca3a (at 10.9.4.81@tcp) reconnecting
[37589.728065] LNet: Service thread pid 14633 was inactive for 62.10s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace for debugging purposes:
[37589.728073] Pid: 14633, comm: mdt00_004
[37589.728073]
[37589.728073] Call Trace:
[37589.757797]&#160; [&amp;lt;ffffffff81612a95&amp;gt;] schedule+0x35/0x80
[37589.757802]&#160; [&amp;lt;ffffffff81615851&amp;gt;] schedule_timeout+0x161/0x2d0
[37589.772170]&#160; [&amp;lt;ffffffffa0c76e3e&amp;gt;] ldlm_completion_ast+0x51e/0x860 [ptlrpc]
[37589.772254]&#160; [&amp;lt;ffffffffa0c78e15&amp;gt;] ldlm_cli_enqueue_fini+0x905/0xd80 [ptlrpc]
[37589.772290]&#160; [&amp;lt;ffffffffa0c7b119&amp;gt;] ldlm_cli_enqueue+0x3e9/0x8c0 [ptlrpc]
[37589.772343]&#160; [&amp;lt;ffffffffa12694a2&amp;gt;] osp_md_object_lock+0x142/0x290 [osp]
[37589.772411]&#160; [&amp;lt;ffffffffa0ea58fa&amp;gt;] lod_object_lock+0xda/0x910 [lod]
[37589.772498]&#160; [&amp;lt;ffffffffa1125d3d&amp;gt;] mdt_remote_object_lock_try+0x1dd/0x6e0 [mdt]
[37589.772519]&#160; [&amp;lt;ffffffffa112750b&amp;gt;] mdt_object_lock_internal+0x15b/0x2f0 [mdt]
[37589.772534]&#160; [&amp;lt;ffffffffa11276bb&amp;gt;] mdt_object_lock+0x1b/0x20 [mdt]
[37589.772549]&#160; [&amp;lt;ffffffffa1172a91&amp;gt;] mdt_lock_objects_in_linkea+0x711/0x9f6 [mdt]
[37589.772568]&#160; [&amp;lt;ffffffffa113be6c&amp;gt;] mdt_reint_migrate_internal.isra.39+0x85c/0x1670 [mdt]
[37589.772583]&#160; [&amp;lt;ffffffffa113ce85&amp;gt;] mdt_reint_rename_or_migrate.isra.40+0x205/0x7c0 [mdt]
[37589.772597]&#160; [&amp;lt;ffffffffa1141351&amp;gt;] mdt_reint_rec+0x71/0x1e0 [mdt]
[37589.772610]&#160; [&amp;lt;ffffffffa112259b&amp;gt;] mdt_reint_internal+0x59b/0x960 [mdt]
[37589.772629]&#160; [&amp;lt;ffffffffa112cd31&amp;gt;] mdt_reint+0x61/0x120 [mdt]
[37589.772673]&#160; [&amp;lt;ffffffffa0d0a44a&amp;gt;] tgt_request_handle+0x8ca/0x1330 [ptlrpc]
[37589.772722]&#160; [&amp;lt;ffffffffa0cb38f8&amp;gt;] ptlrpc_server_handle_request+0x258/0xa60 [ptlrpc]
[37589.772771]&#160; [&amp;lt;ffffffffa0cb7780&amp;gt;] ptlrpc_main+0xa40/0x1da0 [ptlrpc]
[37589.773283]&#160; [&amp;lt;ffffffff8109e8b9&amp;gt;] kthread+0xc9/0xe0
[37589.777689]&#160; [&amp;lt;ffffffff81616f45&amp;gt;] ret_from_fork+0x55/0x80
[37589.806205] (null)DWARF2 unwinder stuck at ret_from_fork+0x55/0x80
[37589.806205]
[37589.806206] (null)Leftover inexact backtrace:
[37589.806206]
[37589.806215]&#160; [&amp;lt;ffffffff8109e7f0&amp;gt;] ? kthread+0x0/0xe0
[37589.806215]
[37589.806221] LustreError: dumping log to /tmp/lustre-log.1521783194.14633
[37590.051214] Pid: 14662, comm: mdt00_027
[37590.051221]
[37590.051221] Call Trace:
[37590.051237]&#160; [&amp;lt;ffffffff81612a95&amp;gt;] schedule+0x35/0x80
[37590.051242]&#160; [&amp;lt;ffffffff81615851&amp;gt;] schedule_timeout+0x161/0x2d0
[37590.051464]&#160; [&amp;lt;ffffffffa0c76e3e&amp;gt;] ldlm_completion_ast+0x51e/0x860 [ptlrpc]
[37590.051541]&#160; [&amp;lt;ffffffffa0c78e15&amp;gt;] ldlm_cli_enqueue_fini+0x905/0xd80 [ptlrpc]
[37590.051597]&#160; [&amp;lt;ffffffffa0c7b119&amp;gt;] ldlm_cli_enqueue+0x3e9/0x8c0 [ptlrpc]
[37590.051621]&#160; [&amp;lt;ffffffffa12694a2&amp;gt;] osp_md_object_lock+0x142/0x290 [osp]
[37590.051654]&#160; [&amp;lt;ffffffffa0ea58fa&amp;gt;] lod_object_lock+0xda/0x910 [lod]
[37590.051691]&#160; [&amp;lt;ffffffffa1125d3d&amp;gt;] mdt_remote_object_lock_try+0x1dd/0x6e0 [mdt]
[37590.051714]&#160; [&amp;lt;ffffffffa1126269&amp;gt;] mdt_remote_object_lock+0x29/0x30 [mdt]
[37590.051736]&#160; [&amp;lt;ffffffffa113cf75&amp;gt;] mdt_reint_rename_or_migrate.isra.40+0x2f5/0x7c0 [mdt]
[37590.051766]&#160; [&amp;lt;ffffffffa1141351&amp;gt;] mdt_reint_rec+0x71/0x1e0 [mdt]
[37590.051787]&#160; [&amp;lt;ffffffffa112259b&amp;gt;] mdt_reint_internal+0x59b/0x960 [mdt]
[37590.051817]&#160; [&amp;lt;ffffffffa112cd31&amp;gt;] mdt_reint+0x61/0x120 [mdt]
[37590.051887]&#160; [&amp;lt;ffffffffa0d0a44a&amp;gt;] tgt_request_handle+0x8ca/0x1330 [ptlrpc]
[37590.051954]&#160; [&amp;lt;ffffffffa0cb38f8&amp;gt;] ptlrpc_server_handle_request+0x258/0xa60 [ptlrpc]
[37590.052044]&#160; [&amp;lt;ffffffffa0cb7780&amp;gt;] ptlrpc_main+0xa40/0x1da0 [ptlrpc]
[37590.052054]&#160; [&amp;lt;ffffffff8109e8b9&amp;gt;] kthread+0xc9/0xe0
[37590.052060]&#160; [&amp;lt;ffffffff81616f45&amp;gt;] ret_from_fork+0x55/0x80
[37590.055121] (null)DWARF2 unwinder stuck at ret_from_fork+0x55/0x80
[37590.055121]&#160;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;On the console logs for the other MDS, with MDT0 and MDT2, we see&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[37506.637291] Lustre: DEBUG MARKER: == racer test 1: racer on clients: trevis-8vm1,trevis-8vm2 DURATION=900 ============================== 22:31:21 (1521783081)
[37514.969720] Lustre: lustre-MDT0002: Client 92f575f3-55a8-8c4a-7087-ea3eadf4f6ae (at 10.9.4.81@tcp) reconnecting
[37518.255252] Lustre: lustre-MDT0002: Client b6648c6a-1d39-4917-499d-0676dd06ca4a (at 10.9.4.82@tcp) reconnecting
[37518.255258] Lustre: Skipped 1 previous similar message
[37519.663174] Lustre: lustre-MDT0000: Client b6648c6a-1d39-4917-499d-0676dd06ca4a (at 10.9.4.82@tcp) reconnecting
[37519.957482] LustreError: 20792:0:(mdt_open.c:1204:mdt_cross_open()) lustre-MDT0002: [0x280000405:0x74:0x0] doesn&apos;t exist!: rc = -14
[37562.012928] Lustre: lustre-MDT0000: Client 92f575f3-55a8-8c4a-7087-ea3eadf4f6ae (at 10.9.4.81@tcp) reconnecting
[37573.001921] Lustre: lustre-MDT0000: Client ea0330a2-74e9-672c-10d5-7c42a043d466 (at 10.9.4.82@tcp) reconnecting
[37573.001924] Lustre: Skipped 3 previous similar messages
[37619.168062] LNet: Service thread pid 20790 was inactive for 62.01s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace for debugging purposes:
[37619.168072] Pid: 20790, comm: mdt00_024
[37619.168072]
[37619.168072] Call Trace:
[37619.190751]&#160; [&amp;lt;ffffffff81612a95&amp;gt;] schedule+0x35/0x80
[37619.190757]&#160; [&amp;lt;ffffffff81615851&amp;gt;] schedule_timeout+0x161/0x2d0
[37619.191048]&#160; [&amp;lt;ffffffffa0977e3e&amp;gt;] ldlm_completion_ast+0x51e/0x860 [ptlrpc]
[37619.191133]&#160; [&amp;lt;ffffffffa0978f31&amp;gt;] ldlm_cli_enqueue_local+0x251/0x830 [ptlrpc]
[37619.191228]&#160; [&amp;lt;ffffffffa111a26e&amp;gt;] mdt_reint_rename_or_migrate.isra.40+0x5ee/0x7c0 [mdt]
[37619.191261]&#160; [&amp;lt;ffffffffa111e351&amp;gt;] mdt_reint_rec+0x71/0x1e0 [mdt]
[37619.191274]&#160; [&amp;lt;ffffffffa10ff59b&amp;gt;] mdt_reint_internal+0x59b/0x960 [mdt]
[37619.191299]&#160; [&amp;lt;ffffffffa1109d31&amp;gt;] mdt_reint+0x61/0x120 [mdt]
[37619.191344]&#160; [&amp;lt;ffffffffa0a0b44a&amp;gt;] tgt_request_handle+0x8ca/0x1330 [ptlrpc]
[37619.191393]&#160; [&amp;lt;ffffffffa09b48f8&amp;gt;] ptlrpc_server_handle_request+0x258/0xa60 [ptlrpc]
[37619.191436]&#160; [&amp;lt;ffffffffa09b8780&amp;gt;] ptlrpc_main+0xa40/0x1da0 [ptlrpc]
[37619.191453]&#160; [&amp;lt;ffffffff8109e8b9&amp;gt;] kthread+0xc9/0xe0
[37619.191468]&#160; [&amp;lt;ffffffff81616f45&amp;gt;] ret_from_fork+0x55/0x80
[37619.194162] (null)DWARF2 unwinder stuck at ret_from_fork+0x55/0x80
[37619.194163]
[37619.194163] (null)Leftover inexact backtrace:
[37619.194163]
[37619.194169]&#160; [&amp;lt;ffffffff8109e7f0&amp;gt;] ? kthread+0x0/0xe0
[37619.194169]
[37619.194176] LustreError: dumping log to /tmp/lustre-log.1521783194.20790
[37619.251541] Pid: 19230, comm: mdt00_001
[37619.251547]
[37619.251547] Call Trace:
[37619.251562]&#160; [&amp;lt;ffffffff81612a95&amp;gt;] schedule+0x35/0x80
[37619.251566]&#160; [&amp;lt;ffffffff81615851&amp;gt;] schedule_timeout+0x161/0x2d0
[37619.251643]&#160; [&amp;lt;ffffffffa0977e3e&amp;gt;] ldlm_completion_ast+0x51e/0x860 [ptlrpc]
[37619.251691]&#160; [&amp;lt;ffffffffa0979e15&amp;gt;] ldlm_cli_enqueue_fini+0x905/0xd80 [ptlrpc]
[37619.251727]&#160; [&amp;lt;ffffffffa097c119&amp;gt;] ldlm_cli_enqueue+0x3e9/0x8c0 [ptlrpc]
[37619.251767]&#160; [&amp;lt;ffffffffa12f34a2&amp;gt;] osp_md_object_lock+0x142/0x290 [osp]
[37619.251835]&#160; [&amp;lt;ffffffffa120a8fa&amp;gt;] lod_object_lock+0xda/0x910 [lod]
[37619.251871]&#160; [&amp;lt;ffffffffa1102d3d&amp;gt;] mdt_remote_object_lock_try+0x1dd/0x6e0 [mdt]
[37619.251885]&#160; [&amp;lt;ffffffffa1103269&amp;gt;] mdt_remote_object_lock+0x29/0x30 [mdt]
[37619.251898]&#160; [&amp;lt;ffffffffa1119f75&amp;gt;] mdt_reint_rename_or_migrate.isra.40+0x2f5/0x7c0 [mdt]
[37619.251913]&#160; [&amp;lt;ffffffffa111e351&amp;gt;] mdt_reint_rec+0x71/0x1e0 [mdt]
[37619.251926]&#160; [&amp;lt;ffffffffa10ff59b&amp;gt;] mdt_reint_internal+0x59b/0x960 [mdt]
[37619.251945]&#160; [&amp;lt;ffffffffa1109d31&amp;gt;] mdt_reint+0x61/0x120 [mdt]
[37619.251990]&#160; [&amp;lt;ffffffffa0a0b44a&amp;gt;] tgt_request_handle+0x8ca/0x1330 [ptlrpc]
[37619.252048]&#160; [&amp;lt;ffffffffa09b48f8&amp;gt;] ptlrpc_server_handle_request+0x258/0xa60 [ptlrpc]
[37619.252088]&#160; [&amp;lt;ffffffffa09b8780&amp;gt;] ptlrpc_main+0xa40/0x1da0 [ptlrpc]
[37619.252095]&#160; [&amp;lt;ffffffff8109e8b9&amp;gt;] kthread+0xc9/0xe0
[37619.252099]&#160; [&amp;lt;ffffffff81616f45&amp;gt;] ret_from_fork+0x55/0x80
[37619.254330] (null)DWARF2 unwinder stuck at ret_from_fork+0x55/0x80
[37619.254331]
[37619.254331] (null)Leftover inexact backtrace:
[37619.254331]
[37619.254334]&#160; [&amp;lt;ffffffff8109e7f0&amp;gt;] ? kthread+0x0/0xe0&#160;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;We have several ls, rm and mv processes in D state on client1:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[41311.155160] ls&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; D ffff880037d7a800&#160;&#160;&#160;&#160; 0 16699&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41311.155162]&#160; ffff8800488afc08 ffff88007a30c0d0 ffff88003f584ec0 ffff8800488b0000
[41311.155163]&#160; ffff88007a30c17c ffff88003f584ec0 00000000ffffffff ffff88007a30c180
[41311.155176]&#160; ffff8800488afc20 ffffffff81610a95 ffff88007a30c178 ffff8800488afc30
[41311.155177] Call Trace:
[41311.155181]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41311.155184]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41311.155186]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41311.155189]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41311.155193]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41311.155197]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41311.155199]&#160; [&amp;lt;ffffffff812174e2&amp;gt;] path_openat+0x92/0x12e0
[41311.155202]&#160; [&amp;lt;ffffffff8121a25e&amp;gt;] do_filp_open+0x7e/0xd0
[41311.155205]&#160; [&amp;lt;ffffffff81209f99&amp;gt;] do_sys_open+0x129/0x200
[41311.155209]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.157343] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.157343]
&#8230;
[41311.191802] Leftover inexact backtrace:
[41311.191802]
[41311.191806] rm&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; D ffff88007fd16440&#160;&#160;&#160;&#160; 0 19246&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41311.191808]&#160; ffff880063a5bc08 ffff88007a30c0d0 ffff880062f74e40 ffff880063a5c000
[41311.191809]&#160; ffff88007a30c17c ffff880062f74e40 00000000ffffffff ffff88007a30c180
[41311.191810]&#160; ffff880063a5bc20 ffffffff81610a95 ffff88007a30c178 ffff880063a5bc30
[41311.191811] Call Trace:
[41311.191814]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41311.191817]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41311.191819]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41311.191821]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41311.191823]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41311.191826]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41311.191829]&#160; [&amp;lt;ffffffff812174e2&amp;gt;] path_openat+0x92/0x12e0
[41311.191831]&#160; [&amp;lt;ffffffff8121a25e&amp;gt;] do_filp_open+0x7e/0xd0
[41311.191833]&#160; [&amp;lt;ffffffff81209f99&amp;gt;] do_sys_open+0x129/0x200
[41311.191836]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.193957] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.193957]
[41311.193958] Leftover inexact backtrace:
[41311.193958]
[41311.193962] mv&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; D ffff880063531040&#160;&#160;&#160;&#160; 0 19385&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41311.193964]&#160; ffff88005f1a3c28 ffff88007a30c0d0 ffff8800631091c0 ffff88005f1a4000
[41311.193965]&#160; ffff88007a30c17c ffff8800631091c0 00000000ffffffff ffff88007a30c180
[41311.193966]&#160; ffff88005f1a3c40 ffffffff81610a95 ffff88007a30c178 ffff88005f1a3c50
[41311.193967] Call Trace:
[41311.193970]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41311.193973]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41311.193975]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41311.193977]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41311.193980]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41311.193983]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41311.193985]&#160; [&amp;lt;ffffffff8121713f&amp;gt;] path_lookupat+0x7f/0x110
[41311.193987]&#160; [&amp;lt;ffffffff81219816&amp;gt;] filename_lookup+0x116/0x150
[41311.193991]&#160; [&amp;lt;ffffffff8120f7b9&amp;gt;] vfs_fstatat+0x49/0x90
[41311.193994]&#160; [&amp;lt;ffffffff8120fc7d&amp;gt;] SYSC_newlstat+0x1d/0x40
[41311.193996]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.196113] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41311.196114]&#160;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;On the other client, ls, ln and getfattr processes are in D state:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[41317.513265] Leftover inexact backtrace:
[41317.513265]
[41317.513269] ls&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; D ffff88005ae9c800&#160;&#160;&#160;&#160; 0&#160; 6830&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41317.513270]&#160; ffff880054e5bc08 ffff880052367bd0 ffff88006426c940 ffff880054e5c000
[41317.513272]&#160; ffff880052367c7c ffff88006426c940 00000000ffffffff ffff880052367c80
[41317.513273]&#160; ffff880054e5bc20 ffffffff81610a95 ffff880052367c78 ffff880054e5bc30
[41317.513273] Call Trace:
[41317.513277]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41317.513279]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41317.513281]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41317.513284]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41317.513286]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41317.513289]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41317.513291]&#160; [&amp;lt;ffffffff812174e2&amp;gt;] path_openat+0x92/0x12e0
[41317.513294]&#160; [&amp;lt;ffffffff8121a2a8&amp;gt;] do_filp_open+0xc8/0xd0
[41317.513296]&#160; [&amp;lt;ffffffff81209f99&amp;gt;] do_sys_open+0x129/0x200
[41317.513299]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.515417] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.515417]
[41317.515417] Leftover inexact backtrace:
[41317.515417]
[41317.515421] getfattr&#160;&#160;&#160;&#160;&#160;&#160;&#160; D ffff880060adb800&#160;&#160;&#160;&#160; 0&#160; 7898&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41317.515422]&#160; ffff88005bc17c28 ffff880052367bd0 ffff88005fb45200 ffff88005bc18000
[41317.515424]&#160; ffff880052367c7c ffff88005fb45200 00000000ffffffff ffff880052367c80
[41317.515425]&#160; ffff88005bc17c40 ffffffff81610a95 ffff880052367c78 ffff88005bc17c50
[41317.515425] Call Trace:
[41317.515429]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41317.515431]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41317.515433]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41317.515436]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41317.515438]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41317.515441]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41317.515443]&#160; [&amp;lt;ffffffff8121713f&amp;gt;] path_lookupat+0x7f/0x110
[41317.515446]&#160; [&amp;lt;ffffffff81219816&amp;gt;] filename_lookup+0x116/0x150
[41317.515449]&#160; [&amp;lt;ffffffff8120f7b9&amp;gt;] vfs_fstatat+0x49/0x90
[41317.515452]&#160; [&amp;lt;ffffffff8120fc3a&amp;gt;] SYSC_newstat+0x1a/0x40
[41317.515454]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.517582] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.517582]
[41317.517582] Leftover inexact backtrace:
[41317.517582]
[41317.517586] ln&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; D 0000000000000001&#160;&#160;&#160;&#160; 0&#160; 8542&#160;&#160;&#160;&#160;&#160; 1 0x00000004
[41317.517587]&#160; ffff88005b603c68 ffff880052367bd0 ffff88005f270040 ffff88005b604000
[41317.517588]&#160; ffff880052367c7c ffff88005f270040 00000000ffffffff ffff880052367c80
[41317.517589]&#160; ffff88005b603c80 ffffffff81610a95 ffff880052367c78 ffff88005b603c90
[41317.517590] Call Trace:
[41317.517593]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41317.517596]&#160; [&amp;lt;ffffffff81610d7e&amp;gt;] schedule_preempt_disabled+0xe/0x10
[41317.517598]&#160; [&amp;lt;ffffffff816125b5&amp;gt;] __mutex_lock_slowpath+0x95/0x110
[41317.517600]&#160; [&amp;lt;ffffffff81612643&amp;gt;] mutex_lock+0x13/0x22
[41317.517602]&#160; [&amp;lt;ffffffff81216760&amp;gt;] walk_component+0x170/0x240
[41317.517606]&#160; [&amp;lt;ffffffff81216c41&amp;gt;] link_path_walk+0x171/0x570
[41317.517610]&#160; [&amp;lt;ffffffff8121713f&amp;gt;] path_lookupat+0x7f/0x110
[41317.517612]&#160; [&amp;lt;ffffffff8121979c&amp;gt;] filename_lookup+0x9c/0x150
[41317.517615]&#160; [&amp;lt;ffffffff8121ac38&amp;gt;] SyS_linkat+0x68/0x2e0
[41317.517617]&#160; [&amp;lt;ffffffff81614b0a&amp;gt;] entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.519736] DWARF2 unwinder stuck at entry_SYSCALL_64_fastpath+0x1e/0xb6
[41317.519737]
[41317.519737] Leftover inexact backtrace:
[41317.519737]
[41317.519740] ldlm_bl_05&#160;&#160;&#160;&#160;&#160; S 0000000000000001&#160;&#160;&#160;&#160; 0&#160; 8829&#160;&#160;&#160;&#160;&#160; 2 0x00000000
[41317.519742]&#160; ffff880058353e18 ffff88005a8b9418 ffff8800576758c0 ffff880058354000
[41317.519743]&#160; ffff88005731d6a4 0000000000000000 ffff8800576758c0 ffff88005731d668
[41317.519744]&#160; ffff880058353e30 ffffffff81610a95 ffff88005731d640 ffff8800576758c0
[41317.519744] Call Trace:
[41317.519748]&#160; [&amp;lt;ffffffff81610a95&amp;gt;] schedule+0x35/0x80
[41317.519770]&#160; [&amp;lt;ffffffffa0b4a510&amp;gt;] ldlm_bl_thread_main+0x3f0/0x690 [ptlrpc]
[41317.519774]&#160; [&amp;lt;ffffffff8109e8f9&amp;gt;] kthread+0xc9/0xe0
[41317.519777]&#160; [&amp;lt;ffffffff81614f45&amp;gt;] ret_from_fork+0x55/0x80
[41317.521908] DWARF2 unwinder stuck at ret_from_fork+0x55/0x80
[41317.521908]
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Logs for this hang are at:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/49a29a5e-2f2f-11e8-9e0e-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/49a29a5e-2f2f-11e8-9e0e-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/97cda774-274a-11e8-9e0e-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/97cda774-274a-11e8-9e0e-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/9efd8706-276a-11e8-9e0e-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/9efd8706-276a-11e8-9e0e-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/444c303c-2e36-11e8-9e0e-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/444c303c-2e36-11e8-9e0e-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</description>
                <environment></environment>
        <key id="51515">LU-10852</key>
            <summary>racer test 1 hangs in locking</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="3" iconUrl="https://jira.whamcloud.com/images/icons/statuses/inprogress.png" description="This issue is being actively worked on at the moment by the assignee.">In Progress</status>
                    <statusCategory id="4" key="indeterminate" colorName="inprogress"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="jamesanunez">James Nunez</reporter>
                        <labels>
                            <label>DNE</label>
                    </labels>
                <created>Mon, 26 Mar 2018 21:34:06 +0000</created>
                <updated>Thu, 19 Nov 2020 20:12:08 +0000</updated>
                                            <version>Lustre 2.11.0</version>
                    <version>Lustre 2.12.0</version>
                    <version>Lustre 2.12.6</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="224632" author="pjones" created="Tue, 27 Mar 2018 18:04:18 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;Can you please advise?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="224998" author="laisiyao" created="Tue, 3 Apr 2018 05:47:23 +0000"  >&lt;p&gt;This is a bug in the migration code: if the file being migrated has a link, and the parent of that link is the same as the source object&apos;s parent, it will deadlock, because the source object&apos;s parent is already locked and the code tries to lock it again. I&apos;ve fixed this issue in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4684&quot; title=&quot;DNE3: allow migrating DNE striped directory&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4684&quot;&gt;&lt;del&gt;LU-4684&lt;/del&gt;&lt;/a&gt;, so maybe it&apos;s not necessary to fix it separately, since dir migration is not officially supported yet.&lt;/p&gt;</comment>
                            <comment id="233340" author="pjones" created="Tue, 11 Sep 2018 17:22:44 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;Is the fix in one of the unlanded patches for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4684&quot; title=&quot;DNE3: allow migrating DNE striped directory&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4684&quot;&gt;&lt;del&gt;LU-4684&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="233369" author="laisiyao" created="Wed, 12 Sep 2018 01:41:35 +0000"  >&lt;p&gt;yes, Peter.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzusv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>