<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:55:22 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-5886] DNE II Testing: Hung threads on MDS; evictions</title>
                <link>https://jira.whamcloud.com/browse/LU-5886</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;During DNE II testing (same run as &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5883&quot; title=&quot;DNE II testing: LustreError: 6618:0:(statahead.c:262:sa_kill()) ASSERTION( !list_empty(&amp;amp;entry-&amp;gt;se_list) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5883&quot;&gt;&lt;del&gt;LU-5883&lt;/del&gt;&lt;/a&gt;), both of our  MDSes reported hung threads here:&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: Pid: 21117, comm: mdt02_008&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel:&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: Call Trace:&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0aaa1a1&amp;gt;&amp;#93;&lt;/span&gt; ? libcfs_debug_msg+0x41/0x50 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e32230&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_expired_completion_wait+0x0/0x360 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e36df5&amp;gt;&amp;#93;&lt;/span&gt; ldlm_completion_ast+0x665/0x9a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81065df0&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e3619e&amp;gt;&amp;#93;&lt;/span&gt; ldlm_cli_enqueue_local+0x21e/0x810 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e36790&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_completion_ast+0x0/0x9a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa1559d70&amp;gt;&amp;#93;&lt;/span&gt; ? mdt_blocking_ast+0x0/0x2a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa156240d&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_local_lock+0x1bd/0xa80 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa1559d70&amp;gt;&amp;#93;&lt;/span&gt; ? mdt_blocking_ast+0x0/0x2a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e36790&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_completion_ast+0x0/0x9a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa1562d35&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_lock_internal+0x65/0x360 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa15630f4&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_lock+0x14/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa156dd6c&amp;gt;&amp;#93;&lt;/span&gt; mdt_getattr_name_lock+0xd9c/0x1a50 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8128a0ea&amp;gt;&amp;#93;&lt;/span&gt; ? strlcpy+0x4a/0x60&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e63774&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_flags+0x34/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e65d40&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_swab_ldlm_reply+0x0/0x40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa156ef42&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_getattr+0x292/0x470 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa155bc44&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_policy+0x494/0xcf0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e16549&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_enqueue+0x129/0x9d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4235b&amp;gt;&amp;#93;&lt;/span&gt; ldlm_handle_enqueue0+0x51b/0x1340 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0a9a4ce&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_timer_arm+0xe/0x10 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ec3842&amp;gt;&amp;#93;&lt;/span&gt; tgt_enqueue+0x62/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ec40ce&amp;gt;&amp;#93;&lt;/span&gt; tgt_request_handle+0x71e/0xb10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e73964&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0xe64/0x1990 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810096f0&amp;gt;&amp;#93;&lt;/span&gt; ? __switch_to+0xd0/0x320&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81527c20&amp;gt;&amp;#93;&lt;/span&gt; ? thread_return+0x4e/0x76e&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e72b00&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x1990 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8109aee6&amp;gt;&amp;#93;&lt;/span&gt; kthread+0x96/0xa0&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c20a&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8109ae50&amp;gt;&amp;#93;&lt;/span&gt; ? kthread+0x0/0xa0&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c200&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
Nov  6 20:22:21 perses-esf-mds001 kernel:&lt;/p&gt;</description>
                <environment>Versions of 2.6.54 on clients &amp;amp; servers.&lt;br/&gt;
Cray SLES11SP3 clients, CentOS servers (2.6.32-431.5.1.el6.x86_64).&lt;br/&gt;
&lt;br/&gt;
Most recent commit on clients:&lt;br/&gt;
Ie7a2a98be8cc97db9af7a64476c06fc7321544eb&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/12142&quot;&gt;http://review.whamcloud.com/12142&lt;/a&gt;&lt;br/&gt;
&lt;br/&gt;
Most recent commit on servers:&lt;br/&gt;
If24443955290b091fd22905dfb74b0d6a6d1b4e8&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/12490&quot;&gt;http://review.whamcloud.com/12490&lt;/a&gt;</environment>
        <key id="27511">LU-5886</key>
            <summary>DNE II Testing: Hung threads on MDS; evictions</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="di.wang">Di Wang</assignee>
                                    <reporter username="paf">Patrick Farrell</reporter>
                        <labels>
                    </labels>
                <created>Fri, 7 Nov 2014 20:33:14 +0000</created>
                <updated>Sun, 10 Oct 2021 22:20:22 +0000</updated>
                            <resolved>Sun, 10 Oct 2021 22:20:22 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="98696" author="paf" created="Fri, 7 Nov 2014 20:34:10 +0000"  >&lt;p&gt;Partial Lustre logs and messages logs from both MDSes are here:&lt;br/&gt;
ftp.whamcloud.com/uploads/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5886&quot; title=&quot;DNE II Testing: Hung threads on MDS; evictions&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5886&quot;&gt;&lt;del&gt;LU-5886&lt;/del&gt;&lt;/a&gt;/lustre_logs_and_messages.tar.gz&lt;/p&gt;</comment>
                            <comment id="98779" author="jlevi" created="Mon, 10 Nov 2014 18:07:16 +0000"  >&lt;p&gt;Di,&lt;br/&gt;
Would you be able to comment on this one?&lt;br/&gt;
Thank you!&lt;/p&gt;</comment>
                            <comment id="99006" author="di.wang" created="Wed, 12 Nov 2014 20:31:44 +0000"  >&lt;p&gt;According to the console log, both MDTs are waiting for the lock of a remote directory.&lt;/p&gt;

&lt;p&gt;mds001&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Nov  6 20:22:21 perses-esf-mds001 kernel: Call Trace:
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0aaa1a1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e32230&amp;gt;] ? ldlm_expired_completion_wait+0x0/0x360 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e36df5&amp;gt;] ldlm_completion_ast+0x665/0x9a0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff81065df0&amp;gt;] ? default_wake_function+0x0/0x20
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e3619e&amp;gt;] ldlm_cli_enqueue_local+0x21e/0x810 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e36790&amp;gt;] ? ldlm_completion_ast+0x0/0x9a0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa1559d70&amp;gt;] ? mdt_blocking_ast+0x0/0x2a0 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa156240d&amp;gt;] mdt_object_local_lock+0x1bd/0xa80 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa1559d70&amp;gt;] ? mdt_blocking_ast+0x0/0x2a0 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e36790&amp;gt;] ? ldlm_completion_ast+0x0/0x9a0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa1562d35&amp;gt;] mdt_object_lock_internal+0x65/0x360 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa15630f4&amp;gt;] mdt_object_lock+0x14/0x20 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa156dd6c&amp;gt;] mdt_getattr_name_lock+0xd9c/0x1a50 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff8128a0ea&amp;gt;] ? strlcpy+0x4a/0x60
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e63774&amp;gt;] ? lustre_msg_get_flags+0x34/0xb0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e65d40&amp;gt;] ? lustre_swab_ldlm_reply+0x0/0x40 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa156ef42&amp;gt;] mdt_intent_getattr+0x292/0x470 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa155bc44&amp;gt;] mdt_intent_policy+0x494/0xcf0 [mdt]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e16549&amp;gt;] ldlm_lock_enqueue+0x129/0x9d0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e4235b&amp;gt;] ldlm_handle_enqueue0+0x51b/0x1340 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0a9a4ce&amp;gt;] ? cfs_timer_arm+0xe/0x10 [libcfs]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0ec3842&amp;gt;] tgt_enqueue+0x62/0x1d0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0ec40ce&amp;gt;] tgt_request_handle+0x71e/0xb10 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e73964&amp;gt;] ptlrpc_main+0xe64/0x1990 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff810096f0&amp;gt;] ? __switch_to+0xd0/0x320
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff81527c20&amp;gt;] ? thread_return+0x4e/0x76e
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffffa0e72b00&amp;gt;] ? ptlrpc_main+0x0/0x1990 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff8109aee6&amp;gt;] kthread+0x96/0xa0
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff8100c20a&amp;gt;] child_rip+0xa/0x20
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff8109ae50&amp;gt;] ? kthread+0x0/0xa0
Nov  6 20:22:21 perses-esf-mds001 kernel: [&amp;lt;ffffffff8100c200&amp;gt;] ? child_rip+0x0/0x20
Nov  6 20:22:21 perses-esf-mds001 kernel: 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;mds002&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Nov  6 20:22:16 perses-esf-mds002 kernel:  req@ffff8803330e1c00 x1484073163441132/t0(0) o36-&amp;gt;ca4f794c-56f5-709e-3a90-0c25c515ac58@30@gni:0/0 lens 552/568 e 18 to 0 dl 1415326941 ref 2 fl Interpret:/0/0 rc 0/0
Nov  6 20:22:21 perses-esf-mds002 kernel: LNet: Service thread pid 10838 was inactive for 600.00s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace for debugging purposes:
Nov  6 20:22:21 perses-esf-mds002 kernel: Pid: 10838, comm: mdt02_000
Nov  6 20:22:21 perses-esf-mds002 kernel: 
Nov  6 20:22:21 perses-esf-mds002 kernel: Call Trace:
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e01230&amp;gt;] ? ldlm_expired_completion_wait+0x0/0x360 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e05df5&amp;gt;] ldlm_completion_ast+0x665/0x9a0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff81065df0&amp;gt;] ? default_wake_function+0x0/0x20
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0dffe76&amp;gt;] ldlm_cli_enqueue_fini+0x926/0xe60 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e00761&amp;gt;] ldlm_cli_enqueue+0x3b1/0x860 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e05790&amp;gt;] ? ldlm_completion_ast+0x0/0x9a0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa1502b60&amp;gt;] ? mdt_remote_blocking_ast+0x0/0x210 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa16d94a8&amp;gt;] osp_md_object_lock+0x188/0x210 [osp]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa15f70bf&amp;gt;] lod_object_lock+0x13f/0x730 [lod]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa166913b&amp;gt;] mdd_object_lock+0x3b/0xd0 [mdd]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa150b07c&amp;gt;] mdt_remote_object_lock+0x14c/0x320 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa150bdee&amp;gt;] mdt_object_lock_internal+0x11e/0x360 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa150c0f4&amp;gt;] mdt_object_lock+0x14/0x20 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa1526f80&amp;gt;] mdt_reint_create+0x700/0xd40 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0c216b0&amp;gt;] ? lu_ucred+0x20/0x30 [obdclass]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa1501ed5&amp;gt;] ? mdt_ucred+0x15/0x20 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa151deec&amp;gt;] ? mdt_root_squash+0x2c/0x3f0 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e57a56&amp;gt;] ? __req_capsule_get+0x166/0x6e0 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff8128a0ea&amp;gt;] ? strlcpy+0x4a/0x60
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa15220fd&amp;gt;] mdt_reint_rec+0x5d/0x200 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa15061a3&amp;gt;] mdt_reint_internal+0x4d3/0x7b0 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa1506a0b&amp;gt;] mdt_reint+0x6b/0x120 [mdt]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e930ce&amp;gt;] tgt_request_handle+0x71e/0xb10 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e42964&amp;gt;] ptlrpc_main+0xe64/0x1990 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff810096f0&amp;gt;] ? __switch_to+0xd0/0x320
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff81527c20&amp;gt;] ? thread_return+0x4e/0x76e
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffffa0e41b00&amp;gt;] ? ptlrpc_main+0x0/0x1990 [ptlrpc]
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff8109aee6&amp;gt;] kthread+0x96/0xa0
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff8100c20a&amp;gt;] child_rip+0xa/0x20
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff8109ae50&amp;gt;] ? kthread+0x0/0xa0
Nov  6 20:22:21 perses-esf-mds002 kernel: [&amp;lt;ffffffff8100c200&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Unfortunately, the debug log you posted is from about 1 hour earlier. Would you be able to find these debug logs?&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Nov  6 20:22:21 perses-esf-mds002 kernel: 
Nov  6 20:22:21 perses-esf-mds002 kernel: LustreError: dumping log to /tmp/lustre-log.1415326941.10838
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Nov  6 20:22:21 perses-esf-mds001 kernel: LustreError: dumping log to /tmp/lustre-log.1415326941.21117
Nov  6 20:24:27 perses-esf-mds001 kernel: Lustre: lock timed out (enqueued at 1415326767, 300s ago)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I am not sure there is valuable information there, but it is worth a try. Thanks.&lt;/p&gt;</comment>
                            <comment id="125244" author="di.wang" created="Wed, 26 Aug 2015 18:12:35 +0000"  >&lt;p&gt;Patrick, could you please try current master to see if you can still reproduce the problem? Thanks.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzx0i7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>16457</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>