<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:33:13 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3356] LBUG LustreError: 3202:0:(mds_open.c:1494:mds_mfd_close()) ASSERTION(pending_child-&gt;d_inode != NULL) failed</title>
                <link>https://jira.whamcloud.com/browse/LU-3356</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;We have now had the same LBUG twice in one month on the MDS for one of our Lustre file systems.&lt;/p&gt;

&lt;p&gt;The error in syslog on the MDS is this:&lt;/p&gt;

&lt;blockquote&gt;
&lt;p&gt;May 18 20:48:56 cs04r-sc-mds03-02 kernel: LustreError: 3202:0:(mds_open.c:1483:mds_mfd_close()) found &quot;orphan&quot; file 1621419:9595d9c8 with link count 0&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: LustreError: 3202:0:(mds_open.c:1494:mds_mfd_close()) ASSERTION(pending_child-&amp;gt;d_inode != NULL) failed&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: LustreError: 3202:0:(mds_open.c:1494:mds_mfd_close()) LBUG&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: Pid: 3202, comm: ll_mdt_rdpg_35&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel:&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: Call Trace:&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff889946a1&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x51/0x60 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88994bda&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x7a/0xd0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8899cfc0&amp;gt;&amp;#93;&lt;/span&gt; tracefile_init+0x0/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88e4cd06&amp;gt;&amp;#93;&lt;/span&gt; mds_mfd_close+0x796/0x1680 &lt;span class=&quot;error&quot;&gt;&amp;#91;mds&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff889e7121&amp;gt;&amp;#93;&lt;/span&gt; LNetMDBind+0x301/0x450 &lt;span class=&quot;error&quot;&gt;&amp;#91;lnet&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88e549f0&amp;gt;&amp;#93;&lt;/span&gt; mds_close+0x6e0/0x8d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mds&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88e27fab&amp;gt;&amp;#93;&lt;/span&gt; mds_handle+0x254b/0x4d10 &lt;span class=&quot;error&quot;&gt;&amp;#91;mds&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8008e1a4&amp;gt;&amp;#93;&lt;/span&gt; enqueue_task+0x41/0x56&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8008e20f&amp;gt;&amp;#93;&lt;/span&gt; __activate_task+0x56/0x6d&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88b05d55&amp;gt;&amp;#93;&lt;/span&gt; lustre_msg_get_conn_cnt+0x35/0xf0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88b0f6d9&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request+0x989/0xe00 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88b0fe35&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_wait_event+0x2e5/0x310 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8008cc1e&amp;gt;&amp;#93;&lt;/span&gt; __wake_up_common+0x3e/0x68&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88b10dc6&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0xf66/0x1120 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfb1&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x11&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff88b0fe60&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0x0/0x1120 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfa7&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0x0/0x11&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel:&lt;br/&gt;
May 18 20:48:56 cs04r-sc-mds03-02 kernel: LustreError: dumping log to /tmp/lustre-log.1368906536.3202&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;bnh65367@cs04r-sc-mds03-02 ~&amp;#93;&lt;/span&gt;$ cat /proc/fs/lustre/version &lt;br/&gt;
lustre: 1.8.7.80&lt;br/&gt;
kernel: patchless_client&lt;br/&gt;
build:  jenkins-gfa6b90d-PRISTINE-2.6.18-274.3.1.el5_lustre.gb18a13c&lt;/p&gt;

&lt;p&gt;This version has been running on these MDS without any problems for quite some time now. I&apos;m not entirely sure without checking why we are running this version but I believe it contains a fix for one issue we have seen frequently.&lt;/p&gt;

&lt;p&gt;Unfortunately we have so far not been able to identify any reproducer etc but after the LBUG until the fail-over today at least 4 clients were hanging on every access to the file system, other clients were fine.&lt;/p&gt;

&lt;p&gt;The logs are still available and we can upload them if it helps.&lt;/p&gt;</description>
                <environment></environment>
        <key id="19055">LU-3356</key>
            <summary>LBUG LustreError: 3202:0:(mds_open.c:1494:mds_mfd_close()) ASSERTION(pending_child-&gt;d_inode != NULL) failed</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="ferner">Frederik Ferner</reporter>
                        <labels>
                    </labels>
                <created>Sat, 18 May 2013 21:28:40 +0000</created>
                <updated>Tue, 25 Nov 2014 15:22:10 +0000</updated>
                            <resolved>Tue, 25 Nov 2014 15:22:10 +0000</resolved>
                                    <version>Lustre 1.8.7</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="58839" author="pjones" created="Sun, 19 May 2013 01:55:38 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Could you please advise on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="58850" author="bobijam" created="Mon, 20 May 2013 01:46:42 +0000"  >&lt;p&gt;please upload the logs.&lt;/p&gt;</comment>
                            <comment id="58973" author="davebond-diamond" created="Tue, 21 May 2013 14:02:42 +0000"  >&lt;p&gt;/var/log/messages from server cs04r-sc-mds03-02&lt;/p&gt;</comment>
                            <comment id="58974" author="davebond-diamond" created="Tue, 21 May 2013 14:07:04 +0000"  >&lt;p&gt;Lustre log files for cs04r-sc-mds03-02&lt;/p&gt;</comment>
                            <comment id="59035" author="bobijam" created="Wed, 22 May 2013 07:12:16 +0000"  >&lt;p&gt;patch tracking at &lt;a href=&quot;http://review.whamcloud.com/6412&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/6412&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="59620" author="ferner" created="Thu, 30 May 2013 10:58:37 +0000"  >&lt;p&gt;I noticed the patch fails very early (in lustre-initialization-1) and the last update has been a while ago. We have a maintenance window coming up next week. If there is a patch we should start testing at least on our test file systems and maybe on the affected file systems, it would be good to have this by then.&lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
Frederik&lt;/p&gt;</comment>
                            <comment id="59624" author="bobijam" created="Thu, 30 May 2013 12:08:40 +0000"  >&lt;p&gt;the test failure is due to TT-1072 issue, I think you can test with this patch.&lt;/p&gt;</comment>
                            <comment id="59626" author="pjones" created="Thu, 30 May 2013 13:16:10 +0000"  >&lt;p&gt;Frederik&lt;/p&gt;

&lt;p&gt;The TT project is not open because it tracks configuration issues in our test lab. So, the failure itself means that the verification testing has not yet taken place rather than there is a problem with the patch.&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="100029" author="pjones" created="Tue, 25 Nov 2014 15:22:10 +0000"  >&lt;p&gt;Frederik&lt;/p&gt;

&lt;p&gt;I think that this issue is no longer relevant since your upgrade to 2.5.x&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="12888" name="lustre-logs.tar.gz" size="2861087" author="davebond-diamond" created="Tue, 21 May 2013 14:07:04 +0000"/>
                            <attachment id="12887" name="mds03-02-messages" size="320363" author="davebond-diamond" created="Tue, 21 May 2013 14:02:41 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvr9r:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>8309</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>