<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:42:25 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-4403] ASSERTION( lock-&gt;l_readers &gt; 0 )</title>
                <link>https://jira.whamcloud.com/browse/LU-4403</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;&amp;lt;0&amp;gt;LustreError: 5766:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_readers &amp;gt; 0 ) failed: ^M&lt;br/&gt;
&amp;lt;0&amp;gt;LustreError: 5766:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) LBUG^M&lt;br/&gt;
&amp;lt;4&amp;gt;Pid: 5766, comm: mdt00_020^M&lt;br/&gt;
&amp;lt;4&amp;gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt;Call Trace:^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0414895&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x55/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0414e97&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x47/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b03b2&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal_nolock+0xd2/0x180 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b4aad&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal+0x4d/0xaa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa054a315&amp;gt;&amp;#93;&lt;/span&gt; ? class_handle2object+0x95/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b5f69&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref+0x39/0x90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0dd74a3&amp;gt;&amp;#93;&lt;/span&gt; mdt_save_lock+0x63/0x300 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06fd900&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_swab_ldlm_reply+0x0/0x40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0dd779c&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_unlock+0x5c/0x160 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e05a4c&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_open_unlock+0xac/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e0c9b4&amp;gt;&amp;#93;&lt;/span&gt; mdt_reint_open+0xdd4/0x20e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e0e34c&amp;gt;&amp;#93;&lt;/span&gt; mdt_reconstruct_open+0x68c/0xc30 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07226a6&amp;gt;&amp;#93;&lt;/span&gt; ? __req_capsule_get+0x166/0x700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06fb1ae&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_flags+0xae/0x1f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e01195&amp;gt;&amp;#93;&lt;/span&gt; mdt_reconstruct+0x45/0x120 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddccfb&amp;gt;&amp;#93;&lt;/span&gt; mdt_reint_internal+0x6bb/0x780 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddd08d&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_reint+0x1ed/0x520 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddaf3e&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_policy+0x39e/0x720 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b27e1&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_enqueue+0x361/0x8d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06d924f&amp;gt;&amp;#93;&lt;/span&gt; ldlm_handle_enqueue0+0x4ef/0x10b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddb3c6&amp;gt;&amp;#93;&lt;/span&gt; mdt_enqueue+0x46/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0de1ab7&amp;gt;&amp;#93;&lt;/span&gt; mdt_handle_common+0x647/0x16d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e1b2b5&amp;gt;&amp;#93;&lt;/span&gt; mds_regular_handle+0x15/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa070b428&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request+0x398/0xc60 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa04155de&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_timer_arm+0xe/0x10 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0426dbf&amp;gt;&amp;#93;&lt;/span&gt; ? lc_watchdog_touch+0x6f/0x170 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0702789&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_wait_event+0xa9/0x290 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810557f3&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up+0x53/0x70^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa070c7be&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0xace/0x1700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa070bcf0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x1700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0ca&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa070bcf0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x1700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa070bcf0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x1700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
&amp;lt;4&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0c0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20^M&lt;br/&gt;
&amp;lt;4&amp;gt;^M&lt;/p&gt;</description>
                <environment></environment>
        <key id="22534">LU-4403</key>
            <summary>ASSERTION( lock-&gt;l_readers &gt; 0 )</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                            <label>llnl</label>
                            <label>mn4</label>
                    </labels>
                <created>Fri, 20 Dec 2013 04:33:41 +0000</created>
                <updated>Mon, 4 Aug 2014 23:57:07 +0000</updated>
                            <resolved>Sat, 8 Feb 2014 05:32:12 +0000</resolved>
                                    <version>Lustre 2.4.1</version>
                                    <fixVersion>Lustre 2.6.0</fixVersion>
                    <fixVersion>Lustre 2.5.2</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>10</watches>
                                                                            <comments>
                            <comment id="73927" author="pjones" created="Fri, 20 Dec 2013 12:42:03 +0000"  >&lt;p&gt;Mike&lt;/p&gt;

&lt;p&gt;Do you think that this might be related to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4135&quot; title=&quot;mdt_save_lock() is broken&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4135&quot;&gt;&lt;del&gt;LU-4135&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="73963" author="di.wang" created="Fri, 20 Dec 2013 19:58:17 +0000"  >&lt;p&gt;IMHO, the fix in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4135&quot; title=&quot;mdt_save_lock() is broken&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4135&quot;&gt;&lt;del&gt;LU-4135&lt;/del&gt;&lt;/a&gt; only fixes the problem in master, which does not exist in b2_4. So this should be a different issue; I will take a look now.&lt;/p&gt;</comment>
                            <comment id="73968" author="di.wang" created="Fri, 20 Dec 2013 21:19:44 +0000"  >&lt;p&gt;It seems this is caused by the race between mdt_intent_fixup_resend and mdt_object_unlock, i.e. mdt_intent_fixup_resend might return a released lock here. Here is the patch &lt;a href=&quot;http://review.whamcloud.com/8642&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8642&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="73983" author="tappro" created="Sat, 21 Dec 2013 12:30:26 +0000"  >&lt;p&gt;Thanks Di!&lt;/p&gt;</comment>
                            <comment id="74181" author="di.wang" created="Tue, 31 Dec 2013 01:11:32 +0000"  >&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/8680&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8680&lt;/a&gt; patch for master.&lt;/p&gt;</comment>
                            <comment id="74209" author="jaylan" created="Wed, 1 Jan 2014 00:20:23 +0000"  >&lt;p&gt;We just hit the same problem half an hour ago. The MDS runs the lustre server with patch #8642 included.&lt;/p&gt;</comment>
                            <comment id="74210" author="pjones" created="Wed, 1 Jan 2014 02:10:26 +0000"  >&lt;p&gt;Jay&lt;/p&gt;

&lt;p&gt;How long has the patch been applied? Is it possible to ascertain yet whether the frequency of occurrence has been altered since it was applied?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="74211" author="di.wang" created="Wed, 1 Jan 2014 04:50:34 +0000"  >&lt;p&gt;Jay,&lt;/p&gt;

&lt;p&gt;Same stack trace? If not, please post here. Are there any other console error messages? &lt;/p&gt;

&lt;p&gt;WangDi&lt;/p&gt;</comment>
                            <comment id="74212" author="mhanafi" created="Wed, 1 Jan 2014 05:27:26 +0000"  >&lt;p&gt;Here is the stack trace.&lt;/p&gt;

&lt;p&gt;bp7-mds1 login: Lustre: MGS: haven&apos;t heard from client fd1923ac-e3da-a3a1-46c2-d0613e7a86a3 (at 10.151.0.150@o2ib) in 227 seconds. I think it&apos;s dead, and I am evicting it. exp ffff880696019800, cur 1388538333 expire 1388538183 last 1388538106^M&lt;br/&gt;
Lustre: Skipped 6 previous similar messages^M&lt;br/&gt;
CONSOLE MARK 201312311730&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;-- MARK -- Tue Dec 31 18:00:00 2013&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
CONSOLE MARK 201312311830&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;-- MARK -- Tue Dec 31 19:00:00 2013&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
LustreError: 5827:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_readers &amp;gt; 0 ) failed: ^M&lt;br/&gt;
LustreError: 5827:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) LBUG^M&lt;br/&gt;
Pid: 5827, comm: mdt01_041^M&lt;br/&gt;
^M&lt;br/&gt;
Call Trace:^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0414895&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x55/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0414e97&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x47/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b03b2&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal_nolock+0xd2/0x180 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b4aad&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal+0x4d/0xaa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa054a315&amp;gt;&amp;#93;&lt;/span&gt; ? class_handle2object+0x95/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b5f69&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_decref+0x39/0x90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0dd74a3&amp;gt;&amp;#93;&lt;/span&gt; mdt_save_lock+0x63/0x300 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06fd900&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_swab_ldlm_reply+0x0/0x40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0dd779c&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_unlock+0x5c/0x160 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e05a5c&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_open_unlock+0xac/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e0c9c4&amp;gt;&amp;#93;&lt;/span&gt; mdt_reint_open+0xdd4/0x20e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e0e35c&amp;gt;&amp;#93;&lt;/span&gt; mdt_reconstruct_open+0x68c/0xc30 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07226a6&amp;gt;&amp;#93;&lt;/span&gt; ? __req_capsule_get+0x166/0x700 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06fb1ae&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_flags+0xae/0x1f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e011a5&amp;gt;&amp;#93;&lt;/span&gt; mdt_reconstruct+0x45/0x120 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddcd0b&amp;gt;&amp;#93;&lt;/span&gt; mdt_reint_internal+0x6bb/0x780 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddd09d&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_reint+0x1ed/0x520 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0ddaf4e&amp;gt;&amp;#93;&lt;/span&gt; mdt_intent_policy+0x39e/0x720 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06b27e1&amp;gt;&amp;#93;&lt;/span&gt; ldlm_lock_enqueue+0x361/0x8d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;^M&lt;br/&gt;
^M&lt;br/&gt;
Entering kdb (current=0xffff88067f709540, pid 5827) on processor 12 Oops: (null)^M&lt;/p&gt;</comment>
                            <comment id="74213" author="mhanafi" created="Wed, 1 Jan 2014 05:53:04 +0000"  >&lt;p&gt;One thing to note: when the MDS hits this LBUG, several OSSes will crash. Here is their backtrace.&lt;br/&gt;
crash&amp;gt; bt&lt;br/&gt;
PID: 12506  TASK: ffff880efef7b540  CPU: 11  COMMAND: &quot;ll_ost_io03_077&quot;&lt;br/&gt;
 #0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d150&amp;#93;&lt;/span&gt; machine_kexec at ffffffff81035d2b&lt;br/&gt;
 #1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d1b0&amp;#93;&lt;/span&gt; crash_kexec at ffffffff810c0412&lt;br/&gt;
 #2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d280&amp;#93;&lt;/span&gt; kdb_kdump_check at ffffffff81285507&lt;br/&gt;
 #3 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d290&amp;#93;&lt;/span&gt; kdb_main_loop at ffffffff812886f7&lt;br/&gt;
 #4 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d3a0&amp;#93;&lt;/span&gt; kdb_save_running at ffffffff8128285e&lt;br/&gt;
 #5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d3b0&amp;#93;&lt;/span&gt; kdba_main_loop at ffffffff81463518&lt;br/&gt;
 #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d3f0&amp;#93;&lt;/span&gt; kdb at ffffffff812859f6&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d460&amp;#93;&lt;/span&gt; kdba_entry at ffffffff81462e37&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d470&amp;#93;&lt;/span&gt; notifier_call_chain at ffffffff81544b85&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d4b0&amp;#93;&lt;/span&gt; atomic_notifier_call_chain at ffffffff81544bea&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d4c0&amp;#93;&lt;/span&gt; notify_die at ffffffff8109c15e&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d4f0&amp;#93;&lt;/span&gt; __die at ffffffff81542a52&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d520&amp;#93;&lt;/span&gt; die at ffffffff8100f288&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d550&amp;#93;&lt;/span&gt; do_general_protection at ffffffff81542632&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d580&amp;#93;&lt;/span&gt; general_protection at ffffffff81541dc5&lt;br/&gt;
    &lt;span class=&quot;error&quot;&gt;&amp;#91;exception RIP: lqe64_hash_keycmp+12&amp;#93;&lt;/span&gt;&lt;br/&gt;
    RIP: ffffffffa0bf8f2c  RSP: ffff880efef7d630  RFLAGS: 00010206&lt;br/&gt;
    RAX: 000000000000114b  RBX: ffff880fd044f680  RCX: 0000000000000000&lt;br/&gt;
    RDX: 0000000000000000  RSI: 5a5a5a5a5a5a5a5a  RDI: ffff880f11a5ef60&lt;br/&gt;
    RBP: ffff880efef7d630   R8: 0000000000000003   R9: 0000000000000001&lt;br/&gt;
    R10: 0000000000000001  R11: 0000000000000000  R12: ffff880efef7d6c0&lt;br/&gt;
    R13: ffff880f11a5ef60  R14: 0000000000000000  R15: 5a5a5a5a5a5a5a5a&lt;br/&gt;
    ORIG_RAX: ffffffffffffffff  CS: 0010  SS: 0018&lt;br/&gt;
#15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d638&amp;#93;&lt;/span&gt; cfs_hash_bd_lookup_intent at ffffffffa04269e5 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d688&amp;#93;&lt;/span&gt; cfs_hash_dual_bd_lookup_locked at ffffffffa0426b67 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d6b8&amp;#93;&lt;/span&gt; cfs_hash_lookup at ffffffffa0427da4 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#18 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d708&amp;#93;&lt;/span&gt; lqe_locate at ffffffffa0bf94f7 &lt;span class=&quot;error&quot;&gt;&amp;#91;lquota&amp;#93;&lt;/span&gt;&lt;br/&gt;
#19 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d748&amp;#93;&lt;/span&gt; qsd_op_begin at ffffffffa0c0c2bf &lt;span class=&quot;error&quot;&gt;&amp;#91;lquota&amp;#93;&lt;/span&gt;&lt;br/&gt;
#20 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d7e8&amp;#93;&lt;/span&gt; osd_declare_qid at ffffffffa0d0ac76 &lt;span class=&quot;error&quot;&gt;&amp;#91;osd_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#21 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d848&amp;#93;&lt;/span&gt; osd_declare_inode_qid at ffffffffa0d0b03e &lt;span class=&quot;error&quot;&gt;&amp;#91;osd_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#22 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d8a8&amp;#93;&lt;/span&gt; osd_declare_write_commit at ffffffffa0cfc3d1 &lt;span class=&quot;error&quot;&gt;&amp;#91;osd_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
#23 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d948&amp;#93;&lt;/span&gt; ofd_commitrw_write at ffffffffa0dc1a93 &lt;span class=&quot;error&quot;&gt;&amp;#91;ofd&amp;#93;&lt;/span&gt;&lt;br/&gt;
#24 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7d9d8&amp;#93;&lt;/span&gt; ofd_commitrw at ffffffffa0dc4abd &lt;span class=&quot;error&quot;&gt;&amp;#91;ofd&amp;#93;&lt;/span&gt;&lt;br/&gt;
#25 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7da68&amp;#93;&lt;/span&gt; obd_commitrw at ffffffffa0d791d8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
#26 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7dae8&amp;#93;&lt;/span&gt; ost_brw_write at ffffffffa0d831d1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
#27 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7dc78&amp;#93;&lt;/span&gt; ost_handle at ffffffffa0d8942b &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
#28 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7ddb8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa0707428 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#29 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7deb8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa07087be &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#30 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880efef7df48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100c0ca&lt;/p&gt;</comment>
                            <comment id="74214" author="di.wang" created="Wed, 1 Jan 2014 06:48:48 +0000"  >&lt;p&gt;Hmm, I think this OSS crash is a different issue; you probably need to open a new ticket for this.&lt;/p&gt;</comment>
                            <comment id="74215" author="di.wang" created="Wed, 1 Jan 2014 07:02:06 +0000"  >&lt;p&gt;Hmm, does your Lustre version include the fix from &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4179&quot; title=&quot;LBUG ASSERTION( !lustre_handle_is_used(&amp;amp;lhc-&amp;gt;mlh_reg_lh) ) failed:&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4179&quot;&gt;&lt;del&gt;LU-4179&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;  LU-4179 mdt: skip open lock enqueue during resent

    Skip open lock enqueue, if the open lock has been
    acquired(mdt_intent_fixup_resent) during resent.

    Signed-off-by: wang di &amp;lt;di.wang@intel.com&amp;gt;
    Change-Id: I625ca438e28520416ee2af884d0a9f9e6f21cf2e
    Reviewed-on: http://review.whamcloud.com/8173
    Tested-by: Jenkins
    Tested-by: Maloo &amp;lt;hpdd-maloo@intel.com&amp;gt;
    Reviewed-by: Oleg Drokin &amp;lt;oleg.drokin@intel.com&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;and &lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;    LU-3273 mdt: Hold med_open_lock before walking med_open_head
    
    Fixed a bug where during replay mdt_mfd_open() calls mdt_handle2mfd()
    without acquiring the med_open_lock.
    We now take the med_open_lock before traversing med_open_head list.
    This bug was noticed during the analysis of LU-3233.
    
    Signed-off-by: Swapnil Pimpale &amp;lt;spimpale@ddn.com&amp;gt;
    Change-Id: Ib879f65d41d35f266897e8961dac78e6c4f0d9ec
    Reviewed-on: http://review.whamcloud.com/7272
    Tested-by: Hudson
    Tested-by: Maloo &amp;lt;whamcloud.maloo@gmail.com&amp;gt;
    Reviewed-by: John L. Hammond &amp;lt;john.hammond@intel.com&amp;gt;
    Reviewed-by: Andreas Dilger &amp;lt;andreas.dilger@intel.com&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Thanks.&lt;/p&gt;</comment>
                            <comment id="74216" author="jaylan" created="Wed, 1 Jan 2014 08:18:02 +0000"  >&lt;p&gt;Peter, the patch was installed Saturday 12/28 afternoon. I do not know how frequently it crashed before. Mahmoud would know better.&lt;/p&gt;

&lt;p&gt;Di, the source is at &lt;a href=&quot;https://github.com/jlan/lustre-nas/commits/nas-2.4.0-1&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://github.com/jlan/lustre-nas/commits/nas-2.4.0-1&lt;/a&gt;.&lt;br/&gt;
The relevant branch is nas-2.4.0-1. The build included commits up to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4403&quot; title=&quot;ASSERTION( lock-&amp;gt;l_readers &amp;gt; 0 )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4403&quot;&gt;&lt;del&gt;LU-4403&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;We do have &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4179&quot; title=&quot;LBUG ASSERTION( !lustre_handle_is_used(&amp;amp;lhc-&amp;gt;mlh_reg_lh) ) failed:&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4179&quot;&gt;&lt;del&gt;LU-4179&lt;/del&gt;&lt;/a&gt;, but not &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3273&quot; title=&quot;mdt_mfd_open() may call mdt_handle2mfd() w/o holding med_open_lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3273&quot;&gt;&lt;del&gt;LU-3273&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="74227" author="di.wang" created="Thu, 2 Jan 2014 07:33:34 +0000"  >&lt;p&gt;Mahmoud, Could you please trace to the source code which line this &quot;&lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e05a5c&amp;gt;&amp;#93;&lt;/span&gt; mdt_object_open_unlock+0xac/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&quot; refers to?&lt;/p&gt;</comment>
                            <comment id="74248" author="mhanafi" created="Thu, 2 Jan 2014 17:05:41 +0000"  >&lt;p&gt;FILE: mdt_open.c&lt;br/&gt;
int mdt_reint_open(struct mdt_thread_info *info, struct mdt_lock_handle *lhc)&lt;br/&gt;
{&lt;br/&gt;
.&lt;br/&gt;
.&lt;br/&gt;
out_child:&lt;br/&gt;
    mdt_object_open_unlock(info, child, lhc, ibits, result); &amp;lt;+++++++++++++++++++++++++++++++ THIS LINE 1733&lt;br/&gt;
        mdt_object_put(info-&amp;gt;mti_env, child);&lt;br/&gt;
out_parent:&lt;br/&gt;
        mdt_object_unlock_put(info, parent, lh, result || !created);&lt;br/&gt;
out:&lt;br/&gt;
    if (result)&lt;br/&gt;
        lustre_msg_set_transno(req-&amp;gt;rq_repmsg, 0);&lt;br/&gt;
    return result;&lt;br/&gt;
}&lt;/p&gt;

&lt;p&gt;crash&amp;gt; bt -l&lt;br/&gt;
PID: 5707   TASK: ffff880824046080  CPU: 16  COMMAND: &quot;mdt00_005&quot;&lt;br/&gt;
 #0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a74c8&amp;#93;&lt;/span&gt; machine_kexec at ffffffff81035d2b&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/arch/x86/kernel/machine_kexec_64.c: 336&lt;br/&gt;
 #1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7528&amp;#93;&lt;/span&gt; crash_kexec at ffffffff810c0412&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kernel/kexec.c: 1121&lt;br/&gt;
 #2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a75f8&amp;#93;&lt;/span&gt; kdb_kdump_check at ffffffff81285507&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kdb/kdbmain.c: 1214&lt;br/&gt;
 #3 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7608&amp;#93;&lt;/span&gt; kdb_main_loop at ffffffff812886f7&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kdb/kdbmain.c: 1322&lt;br/&gt;
 #4 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7718&amp;#93;&lt;/span&gt; kdb_save_running at ffffffff8128285e&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kdb/kdbsupport.c: 798&lt;br/&gt;
 #5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7728&amp;#93;&lt;/span&gt; kdba_main_loop at ffffffff81463518&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/arch/x86/kdb/kdba_support.c: 980&lt;br/&gt;
 #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7768&amp;#93;&lt;/span&gt; kdb at ffffffff812859f6&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kdb/kdbmain.c: 2165&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a77d8&amp;#93;&lt;/span&gt; panic at ffffffff8153e8fb&lt;br/&gt;
    /usr/src/debug/kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/kernel/panic.c: 117&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7858&amp;#93;&lt;/span&gt; lbug_with_loc at ffffffffa0414eeb &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7878&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal_nolock at ffffffffa06b03b2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7898&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal at ffffffffa06b4aad &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a78f8&amp;#93;&lt;/span&gt; ldlm_lock_decref at ffffffffa06b5f69 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7928&amp;#93;&lt;/span&gt; mdt_save_lock at ffffffffa0c6d4a3 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_handler.c: 2711&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7978&amp;#93;&lt;/span&gt; mdt_object_unlock at ffffffffa0c6d79c &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_handler.c: 2737&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a79a8&amp;#93;&lt;/span&gt; mdt_object_open_unlock at ffffffffa0c9ba5c &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_open.c: 1270&lt;br/&gt;
#15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a79f8&amp;#93;&lt;/span&gt; mdt_reint_open at ffffffffa0ca29c4 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_open.c: 1734&lt;br/&gt;
#16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7ae8&amp;#93;&lt;/span&gt; mdt_reconstruct_open at ffffffffa0ca435c &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/libcfs/include/libcfs/libcfs_debug.h: 211&lt;br/&gt;
#17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7b78&amp;#93;&lt;/span&gt; mdt_reconstruct at ffffffffa0c971a5 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/libcfs/include/libcfs/libcfs_debug.h: 211&lt;br/&gt;
#18 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7b98&amp;#93;&lt;/span&gt; mdt_reint_internal at ffffffffa0c72d0b &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/libcfs/include/libcfs/libcfs_debug.h: 211&lt;br/&gt;
#19 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7bd8&amp;#93;&lt;/span&gt; mdt_intent_reint at ffffffffa0c7309d &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_handler.c: 3828&lt;br/&gt;
#20 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7c28&amp;#93;&lt;/span&gt; mdt_intent_policy at ffffffffa0c70f4e &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/libcfs/include/libcfs/libcfs_debug.h: 211&lt;br/&gt;
#21 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7c68&amp;#93;&lt;/span&gt; ldlm_lock_enqueue at ffffffffa06b27e1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#22 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7cc8&amp;#93;&lt;/span&gt; ldlm_handle_enqueue0 at ffffffffa06d924f &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#23 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7d38&amp;#93;&lt;/span&gt; mdt_enqueue at ffffffffa0c713d6 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_handler.c: 2283&lt;br/&gt;
#24 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7d58&amp;#93;&lt;/span&gt; mdt_handle_common at ffffffffa0c78787 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/mdt_handler.c: 3040&lt;br/&gt;
#25 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7da8&amp;#93;&lt;/span&gt; mds_regular_handle at ffffffffa0cb12c5 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
    /usr/src/debug/lustre-2.4.0/lustre/mdt/out_handler.c: 1031&lt;br/&gt;
#26 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7db8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa070b428 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#27 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7eb8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa070c7be &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#28 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88068a5a7f48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100c0ca&lt;br/&gt;
    /usr/src/debug////////kernel-lustre240-2.6.32-358.6.2.el6/linux-2.6.32-358.6.2.el6.20130607.x86_64/arch/x86/kernel/entry_64.S: 1213&lt;/p&gt;
</comment>
                            <comment id="74274" author="di.wang" created="Thu, 2 Jan 2014 21:42:39 +0000"  >&lt;p&gt;Thanks! Mahmoud.  It seems in 2.4, MDS will enqueue the open lock anyway, and if the client does not require the open lock, MDT will release the lock later. It is different from b2_1, which only enqueues the open lock if the client requires it (probably brought in by the layout lock patch?).  Anyway, this change will add some &quot;local&quot; open lock to the export hash list, which will trigger this problem. I will post a patch soon.  &lt;/p&gt;</comment>
                            <comment id="74278" author="di.wang" created="Thu, 2 Jan 2014 22:22:47 +0000"  >&lt;p&gt;Ok, I just updated the patch.&lt;/p&gt;

&lt;p&gt;b2_4 &lt;a href=&quot;http://review.whamcloud.com/8642&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8642&lt;/a&gt;&lt;br/&gt;
master &lt;a href=&quot;http://review.whamcloud.com/8680&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8680&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="74313" author="jaylan" created="Fri, 3 Jan 2014 18:48:45 +0000"  >&lt;p&gt;Di, is &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3273&quot; title=&quot;mdt_mfd_open() may call mdt_handle2mfd() w/o holding med_open_lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3273&quot;&gt;&lt;del&gt;LU-3273&lt;/del&gt;&lt;/a&gt; related to this problem? &lt;/p&gt;</comment>
                            <comment id="74319" author="di.wang" created="Fri, 3 Jan 2014 22:30:22 +0000"  >&lt;p&gt;Jay, probably no, the patch here should be enough for this problem. Btw: Did you create a new ticket for the crash you find on OSS?&lt;/p&gt;</comment>
                            <comment id="74440" author="mhanafi" created="Mon, 6 Jan 2014 23:45:48 +0000"  >&lt;p&gt;We installed the latest version of the patch. It still crashed 2 times after the update. We now know what is causing this. A user is using hdf5 to do parallel writes to 1 file from ~2000 processes. I am working on getting a reproducer.&lt;/p&gt;

&lt;p&gt;The new crashes were exactly the same.&lt;/p&gt;
</comment>
                            <comment id="74450" author="di.wang" created="Tue, 7 Jan 2014 00:24:30 +0000"  >&lt;p&gt;Interesting. Hmm, if you can reproduce this on a test system and collect some debug logs when the crash happens, it would be very helpful. Thanks.&lt;/p&gt;</comment>
                            <comment id="74514" author="mhanafi" created="Tue, 7 Jan 2014 20:53:42 +0000"  >&lt;p&gt;Which debug log would you like me to collect? Since the system drops to kdb as soon as we hit the LBUG we need a way to collect those logs.&lt;/p&gt;
</comment>
                            <comment id="74519" author="di.wang" created="Tue, 7 Jan 2014 21:57:04 +0000"  >&lt;p&gt;You can disable panic_on_lbug on MDS (lctl set_param panic_on_lbug=0), then if LBUG happens, the system will dump the debug log somewhere automatically (you can see this in console message).  And also if you can set debug level to -1 (lctl set_param debug=-1) and debug size to 20 (lctl set_param debug_size=30) on MDS, that would make sure the debug log includes enough information we need during LBUG, but these parameter changes (debug and debug_size) will slow down your system; please be aware of this.&lt;/p&gt;</comment>
                            <comment id="74523" author="jay" created="Tue, 7 Jan 2014 23:43:21 +0000"  >&lt;p&gt;Hi Mahmoud,&lt;/p&gt;

&lt;p&gt;will you please tell me what&apos;s the tip of your branch in your comment at:&lt;/p&gt;

&lt;p&gt;&quot;Mahmoud Hanafi added a comment - 02/Jan/14 9:05 AM&quot;&lt;/p&gt;

&lt;p&gt;Jinshan&lt;/p&gt;</comment>
                            <comment id="74525" author="jay" created="Tue, 7 Jan 2014 23:47:15 +0000"  >&lt;p&gt;Just a quick update, will you try the patch below to see if I have some good luck here:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;[jinxiong@intel nasa]$ git diff
diff --git a/lustre/mdt/mdt_open.c b/lustre/mdt/mdt_open.c
index 545507f..f2a23ee 100644
--- a/lustre/mdt/mdt_open.c
+++ b/lustre/mdt/mdt_open.c
@@ -1437,7 +1437,7 @@ &lt;span class=&quot;code-object&quot;&gt;int&lt;/span&gt; mdt_reint_open(struct mdt_thread_info *info, struct mdt_lock_handle *lhc)
         struct lu_fid           *child_fid = &amp;amp;info-&amp;gt;mti_tmp_fid1;
         struct md_attr          *ma = &amp;amp;info-&amp;gt;mti_attr;
         __u64                    create_flags = info-&amp;gt;mti_spec.sp_cr_flags;
-       __u64                    ibits;
+       __u64                    ibits = 0;
         struct mdt_reint_record *rr = &amp;amp;info-&amp;gt;mti_rr;
         struct lu_name          *lname;
         &lt;span class=&quot;code-object&quot;&gt;int&lt;/span&gt;                      result, rc;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="74526" author="jay" created="Tue, 7 Jan 2014 23:50:45 +0000"  >&lt;p&gt;Obviously ibits is not initialized in this case, and that caused the lock in @lhc, on which we don&apos;t hold any references, to be dropped.&lt;/p&gt;</comment>
                            <comment id="74529" author="di.wang" created="Wed, 8 Jan 2014 00:02:58 +0000"  >&lt;p&gt;Ah, good catch. Jinshan. Really missed this.&lt;/p&gt;</comment>
                            <comment id="74530" author="mhanafi" created="Wed, 8 Jan 2014 00:14:23 +0000"  >&lt;p&gt;I have attached mdt_thread_info structure from the dump. It may help...&lt;/p&gt;</comment>
                            <comment id="74531" author="di.wang" created="Wed, 8 Jan 2014 00:14:26 +0000"  >&lt;p&gt;Mahmoud: please try the update patch &lt;a href=&quot;http://review.whamcloud.com/#/c/8642/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8642/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="74593" author="jay" created="Wed, 8 Jan 2014 19:59:04 +0000"  >&lt;p&gt;patch &lt;a href=&quot;http://review.whamcloud.com/6511&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/6511&lt;/a&gt; already fixed this problem. Worth trying this alone if you guys have a chance.&lt;/p&gt;</comment>
                            <comment id="74962" author="jay" created="Tue, 14 Jan 2014 21:58:48 +0000"  >&lt;p&gt;drop the priority as there is no response from customer meanwhile I believe we&apos;ve found the root cause of this issue.&lt;/p&gt;</comment>
                            <comment id="74973" author="jaylan" created="Tue, 14 Jan 2014 23:19:32 +0000"  >&lt;p&gt;We had #8642 patch set 5 installed on Jan 8th. Yesterday morning the mds crashed (patch set 4) and booted up with patch set 5. &lt;/p&gt;

&lt;p&gt;Today early morning the mds crashed again; however, it was caused by another bug in OSS and the OSS crash brought down the mds. So, we have patch set 5 running for &amp;gt; 1 day without hitting this problem. We will let it soak more time.&lt;/p&gt;</comment>
                            <comment id="74977" author="jay" created="Wed, 15 Jan 2014 01:00:33 +0000"  >&lt;p&gt;thanks for the update Jay and good luck with patch set 5.&lt;/p&gt;</comment>
                            <comment id="75814" author="mhanafi" created="Tue, 28 Jan 2014 22:48:24 +0000"  >&lt;p&gt;Patch set 5 didn&apos;t fix the issue. We just hit this bug again.&lt;/p&gt;

&lt;p&gt;LustreError: 45299:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_readers &amp;gt; 0 ) failed: &lt;br/&gt;
LustreError: 45299:0:(ldlm_lock.c:851:ldlm_lock_decref_internal_nolock()) LBUG&lt;br/&gt;
Pid: 45299, comm: mdt02_087&lt;/p&gt;

&lt;p&gt;PID: 20719  TASK: ffff880368864aa0  CPU: 24  COMMAND: &quot;mdt01_059&quot;&lt;br/&gt;
 #0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5394c8&amp;#93;&lt;/span&gt; machine_kexec at ffffffff81035e8b&lt;br/&gt;
 #1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539528&amp;#93;&lt;/span&gt; crash_kexec at ffffffff810c0492&lt;br/&gt;
 #2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5395f8&amp;#93;&lt;/span&gt; kdb_kdump_check at ffffffff812858d7&lt;br/&gt;
 #3 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539608&amp;#93;&lt;/span&gt; kdb_main_loop at ffffffff81288ac7&lt;br/&gt;
 #4 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539718&amp;#93;&lt;/span&gt; kdb_save_running at ffffffff81282c2e&lt;br/&gt;
 #5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539728&amp;#93;&lt;/span&gt; kdba_main_loop at ffffffff81463988&lt;br/&gt;
 #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539768&amp;#93;&lt;/span&gt; kdb at ffffffff81285dc6&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5397d8&amp;#93;&lt;/span&gt; panic at ffffffff8153efbf&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539858&amp;#93;&lt;/span&gt; lbug_with_loc at ffffffffa045deeb &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539878&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal_nolock at ffffffffa0706402 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539898&amp;#93;&lt;/span&gt; ldlm_lock_decref_internal at ffffffffa070aafd &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5398f8&amp;#93;&lt;/span&gt; ldlm_lock_decref at ffffffffa070bfb9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539928&amp;#93;&lt;/span&gt; mdt_save_lock at ffffffffa0e3c483 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539978&amp;#93;&lt;/span&gt; mdt_object_unlock at ffffffffa0e3c77c &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5399a8&amp;#93;&lt;/span&gt; mdt_object_open_unlock at ffffffffa0e6acfc &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c5399f8&amp;#93;&lt;/span&gt; mdt_reint_open at ffffffffa0e71d14 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539ae8&amp;#93;&lt;/span&gt; mdt_reconstruct_open at ffffffffa0e736ac &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539b78&amp;#93;&lt;/span&gt; mdt_reconstruct at ffffffffa0e66445 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#18 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539b98&amp;#93;&lt;/span&gt; mdt_reint_internal at ffffffffa0e41cfb &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#19 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539bd8&amp;#93;&lt;/span&gt; mdt_intent_reint at ffffffffa0e42090 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#20 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539c28&amp;#93;&lt;/span&gt; mdt_intent_policy at ffffffffa0e3ff3e &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#21 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539c68&amp;#93;&lt;/span&gt; ldlm_lock_enqueue at ffffffffa0708831 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#22 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539cc8&amp;#93;&lt;/span&gt; ldlm_handle_enqueue0 at ffffffffa072f1ef &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#23 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539d38&amp;#93;&lt;/span&gt; mdt_enqueue at ffffffffa0e403c6 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#24 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539d58&amp;#93;&lt;/span&gt; mdt_handle_common at ffffffffa0e46ad7 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#25 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539da8&amp;#93;&lt;/span&gt; mds_regular_handle at ffffffffa0e80615 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
#26 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539db8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa07613c8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#27 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539eb8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa076275e &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
#28 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88036c539f48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100c0ca&lt;/p&gt;</comment>
                            <comment id="75818" author="jay" created="Tue, 28 Jan 2014 23:23:37 +0000"  >&lt;p&gt;Can you share the following info with me:&lt;br/&gt;
1. Comparing to the previous patches, did it last longer after applying patch set 5?&lt;br/&gt;
2. what&apos;s the tip of the source tree you&apos;re running?&lt;/p&gt;

&lt;p&gt;Jinshan&lt;/p&gt;</comment>
                            <comment id="75819" author="jaylan" created="Tue, 28 Jan 2014 23:30:47 +0000"  >&lt;p&gt;My bad. The patch set #5 was in my nas-2.4.0-1 branch, but not&lt;br/&gt;
in nas-2.4.1 branch. It was an earlier patch in nas-2.4.1 branch.&lt;/p&gt;

&lt;p&gt;We just upgraded our server to 2.4.1 yesterday.&lt;/p&gt;</comment>
                            <comment id="76540" author="pjones" created="Sat, 8 Feb 2014 05:32:12 +0000"  >&lt;p&gt;Patch landed for 2.6&lt;/p&gt;</comment>
                            <comment id="76802" author="javed" created="Wed, 12 Feb 2014 03:24:22 +0000"  >&lt;p&gt;just fyi, we were hit on 9th feb...i&apos;ve attached the mds.log. &lt;br/&gt;
this is on lustre 2.4.2, haven&apos;t patched yet.&lt;/p&gt;</comment>
                            <comment id="81964" author="jamesanunez" created="Fri, 18 Apr 2014 17:05:45 +0000"  >&lt;p&gt;Patch for b2_5 at &lt;a href=&quot;http://review.whamcloud.com/#/c/9779/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9779/&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="14093" name="mds.log" size="6033" author="javed" created="Wed, 12 Feb 2014 03:23:51 +0000"/>
                            <attachment id="13963" name="mdt_thread_info.dump" size="52574" author="mhanafi" created="Wed, 8 Jan 2014 00:14:55 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwbpj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>12085</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>