<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:12:15 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-7825] ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&gt;l_writers &gt; 0</title>
                <link>https://jira.whamcloud.com/browse/LU-7825</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Error happens during soak testing of build &apos;20160224&apos; (b2_8 RC2) (see:&lt;br/&gt;
&lt;a href=&quot;https://wiki.hpdd.intel.com/pages/viewpage.action?title=Soak+Testing+on+Lola&amp;amp;spaceKey=Releases#SoakTestingonLola-20150224&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://wiki.hpdd.intel.com/pages/viewpage.action?title=Soak+Testing+on+Lola&amp;amp;spaceKey=Releases#SoakTestingonLola-20150224&lt;/a&gt;). DNE is enabled.&lt;br/&gt;
MDSes had been formatted using ldiskfs, OSTs using zfs. MDSes are configured in an active-active HA failover configuration.&lt;/p&gt;

&lt;p&gt;Sequence of events:&lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;2016-02-27 02:04:02,121:fsmgmt.fsmgmt:INFO     mds_failover just completed (lola-10 ---&amp;gt; lola-11)&lt;/li&gt;
	&lt;li&gt;Feb 27 02:06:44 lola-10 kernel: Lustre: soaked-MDT0005: Recovery over after 2:42, of 16 clients 14 recovered and 2 were evicted.&lt;/li&gt;
	&lt;li&gt;Feb 27 02:12:06 lola-10 kernel: Lustre: soaked-MDT0004: Recovery over after 8:02, of 16 clients 11 recovered and 5 were evicted.&lt;/li&gt;
	&lt;li&gt;2016-02-27 02:12:58 lola-9 (different HA pair) crashed&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;The error reads as:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;&amp;lt;0&amp;gt;LustreError: 5003:0:(ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_writers &amp;gt; 0 ) failed: 
&amp;lt;0&amp;gt;LustreError: 5003:0:(ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) LBUG
&amp;lt;4&amp;gt;Pid: 5003, comm: mdt02_007
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0748875&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0748e77&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a2ef0f&amp;gt;] ldlm_lock_decref_internal_nolock+0x17f/0x180 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a3102d&amp;gt;] ldlm_lock_decref_internal+0x4d/0xa80 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa083f935&amp;gt;] ? class_handle2object+0x95/0x190 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a325a0&amp;gt;] ldlm_lock_decref_and_cancel+0x80/0x150 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa1164c67&amp;gt;] mdt_object_unlock+0xa7/0x2e0 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa11867ca&amp;gt;] mdt_reint_rename_or_migrate+0xf3a/0x2600 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0ab7bdd&amp;gt;] ? null_alloc_rs+0xcd/0x320 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0876cbc&amp;gt;] ? upcall_cache_get_entry+0x29c/0x880 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa087bbf0&amp;gt;] ? lu_ucred+0x20/0x30 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a7d100&amp;gt;] ? lustre_pack_reply_v2+0x180/0x280 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa117d50f&amp;gt;] ? ucred_set_jobid+0x5f/0x70 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa1187ec3&amp;gt;] mdt_reint_rename+0x13/0x20 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa118118d&amp;gt;] mdt_reint_rec+0x5d/0x200 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa116cddb&amp;gt;] mdt_reint_internal+0x62b/0x9f0 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa116d63b&amp;gt;] mdt_reint+0x6b/0x120 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0ae0c2c&amp;gt;] tgt_request_handle+0x8ec/0x1440 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a8dc61&amp;gt;] ptlrpc_main+0xd21/0x1800 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8152a39e&amp;gt;] ? thread_return+0x4e/0x7d0
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a8cf40&amp;gt;] ? ptlrpc_main+0x0/0x1800 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8109e78e&amp;gt;] kthread+0x9e/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c28a&amp;gt;] child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8109e6f0&amp;gt;] ? kthread+0x0/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c280&amp;gt;] ? child_rip+0x0/0x20
&amp;lt;4&amp;gt;
&amp;lt;0&amp;gt;Kernel panic - not syncing: LBUG
&amp;lt;4&amp;gt;Pid: 5003, comm: mdt02_007 Tainted: P           ---------------    2.6.32-504.30.3.el6_lustre.x86_64 #1
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81529c9c&amp;gt;] ? panic+0xa7/0x16f
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0748ecb&amp;gt;] ? lbug_with_loc+0x9b/0xb0 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a2ef0f&amp;gt;] ? ldlm_lock_decref_internal_nolock+0x17f/0x180 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a3102d&amp;gt;] ? ldlm_lock_decref_internal+0x4d/0xa80 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa083f935&amp;gt;] ? class_handle2object+0x95/0x190 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a325a0&amp;gt;] ? ldlm_lock_decref_and_cancel+0x80/0x150 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa1164c67&amp;gt;] ? mdt_object_unlock+0xa7/0x2e0 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa11867ca&amp;gt;] ? mdt_reint_rename_or_migrate+0xf3a/0x2600 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0ab7bdd&amp;gt;] ? null_alloc_rs+0xcd/0x320 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0876cbc&amp;gt;] ? upcall_cache_get_entry+0x29c/0x880 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa087bbf0&amp;gt;] ? lu_ucred+0x20/0x30 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a7d100&amp;gt;] ? lustre_pack_reply_v2+0x180/0x280 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa117d50f&amp;gt;] ? ucred_set_jobid+0x5f/0x70 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa1187ec3&amp;gt;] ? mdt_reint_rename+0x13/0x20 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa118118d&amp;gt;] ? mdt_reint_rec+0x5d/0x200 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa116cddb&amp;gt;] ? mdt_reint_internal+0x62b/0x9f0 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa116d63b&amp;gt;] ? mdt_reint+0x6b/0x120 [mdt]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0ae0c2c&amp;gt;] ? tgt_request_handle+0x8ec/0x1440 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a8dc61&amp;gt;] ? ptlrpc_main+0xd21/0x1800 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8152a39e&amp;gt;] ? thread_return+0x4e/0x7d0
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a8cf40&amp;gt;] ? ptlrpc_main+0x0/0x1800 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8109e78e&amp;gt;] ? kthread+0x9e/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c28a&amp;gt;] ? child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8109e6f0&amp;gt;] ? kthread+0x0/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c280&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Attached are the messages and console logs of MDS nodes &lt;tt&gt;lola-9&lt;/tt&gt; and &lt;tt&gt;lola-10&lt;/tt&gt;, as well as vmcore-dmesg.txt. &lt;br/&gt;
The crash file will be saved separately.&lt;/p&gt;</description>
                <environment>lola&lt;br/&gt;
build: &lt;a href=&quot;https://build.hpdd.intel.com/job/lustre-b2_8/8/&quot;&gt;https://build.hpdd.intel.com/job/lustre-b2_8/8/&lt;/a&gt;</environment>
        <key id="35029">LU-7825</key>
            <summary>ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&gt;l_writers &gt; 0</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="di.wang">Di Wang</assignee>
                                    <reporter username="heckes">Frank Heckes</reporter>
                        <labels>
                            <label>soak</label>
                    </labels>
                <created>Sat, 27 Feb 2016 10:48:40 +0000</created>
                <updated>Wed, 16 Mar 2016 03:41:17 +0000</updated>
                            <resolved>Wed, 16 Mar 2016 03:40:14 +0000</resolved>
                                    <version>Lustre 2.8.0</version>
                                    <fixVersion>Lustre 2.8.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="144061" author="heckes" created="Sat, 27 Feb 2016 11:00:41 +0000"  >&lt;p&gt;The crash file has been saved at &lt;tt&gt;lhn.hpdd.intel.com:/scratch/crashdumps/lu-7825/lola-9/127.0.0.1-2016-02-27-02\:12\:58/&lt;/tt&gt;.&lt;/p&gt;</comment>
                            <comment id="144069" author="di.wang" created="Sat, 27 Feb 2016 19:18:52 +0000"  >&lt;p&gt;Hmm, it looks like the lock is not released correctly in the error handler path of mdt_reint_rename_internal(). I will cook a patch.&lt;/p&gt;</comment>
                            <comment id="144070" author="gerrit" created="Sat, 27 Feb 2016 19:24:30 +0000"  >&lt;p&gt;wangdi (di.wang@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/18707&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/18707&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-7825&quot; title=&quot;ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_writers &amp;gt; 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-7825&quot;&gt;&lt;del&gt;LU-7825&lt;/del&gt;&lt;/a&gt; mdt: release parent lock correctly for rename&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 6a240c713c30cd5b167d32e5c2a163f6b18d8ef6&lt;/p&gt;</comment>
                            <comment id="144285" author="gerrit" created="Tue, 1 Mar 2016 13:20:56 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;http://review.whamcloud.com/18707/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/18707/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-7825&quot; title=&quot;ldlm_lock.c:810:ldlm_lock_decref_internal_nolock()) ASSERTION( lock-&amp;gt;l_writers &amp;gt; 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-7825&quot;&gt;&lt;del&gt;LU-7825&lt;/del&gt;&lt;/a&gt; mdt: release parent lock correctly for rename&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 30ece848c046dda5c450dc49c6b146360c077a22&lt;/p&gt;</comment>
                            <comment id="145692" author="jgmitter" created="Wed, 16 Mar 2016 03:40:14 +0000"  >&lt;p&gt;Landed to master and b2_8.  Is present in the 2.8.0 release.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="20587" name="console-lola-10.log.bz2" size="401899" author="heckes" created="Sat, 27 Feb 2016 10:57:27 +0000"/>
                            <attachment id="20586" name="console-lola-9.log.bz2" size="622631" author="heckes" created="Sat, 27 Feb 2016 10:57:27 +0000"/>
                            <attachment id="20588" name="lola-9-vmcore-dmesg.txt.bz2" size="35077" author="heckes" created="Sat, 27 Feb 2016 10:57:27 +0000"/>
                            <attachment id="20590" name="messages-lola-10.log.bz2" size="317755" author="heckes" created="Sat, 27 Feb 2016 10:57:27 +0000"/>
                            <attachment id="20589" name="messages-lola-9.log.bz2" size="276259" author="heckes" created="Sat, 27 Feb 2016 10:57:27 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzy32n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>