<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:16:15 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1395] MDS hangs after calltrace at ldlm_expired_completion_wait()</title>
                <link>https://jira.whamcloud.com/browse/LU-1395</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;We saw the following call traces on the MDS, and it hung afterwards.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Apr 23 15:58:34 ALPL505 kernel: Call Trace:
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88953a00&amp;gt;] ldlm_expired_completion_wait+0x0/0x250 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88955542&amp;gt;] ldlm_completion_ast+0x4c2/0x880 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8893a709&amp;gt;] ldlm_lock_enqueue+0x9d9/0xb20 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8008e421&amp;gt;] default_wake_function+0x0/0xe
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88935b6a&amp;gt;] ldlm_lock_addref_internal_nolock+0x3a/0x90 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff889540bb&amp;gt;] ldlm_cli_enqueue_local+0x46b/0x520 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88caa157&amp;gt;] enqueue_ordered_locks+0x387/0x4d0 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff889519a0&amp;gt;] ldlm_blocking_ast+0x0/0x2a0 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88955080&amp;gt;] ldlm_completion_ast+0x0/0x880 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88caa8e9&amp;gt;] mds_get_parent_child_locked+0x649/0x960 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88c9b652&amp;gt;] mds_getattr_lock+0x632/0xc90 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88c96dda&amp;gt;] fixup_handle_for_resent_req+0x5a/0x2c0 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88ca1d83&amp;gt;] mds_intent_policy+0x623/0xc20 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8893c270&amp;gt;] ldlm_resource_putref_internal+0x230/0x460 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88939eb6&amp;gt;] ldlm_lock_enqueue+0x186/0xb20 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff889367fd&amp;gt;] ldlm_lock_create+0x9bd/0x9f0 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8895e870&amp;gt;] ldlm_server_blocking_ast+0x0/0x83d [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8895bb39&amp;gt;] ldlm_handle_enqueue+0xc09/0x1210 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88ca0b30&amp;gt;] mds_handle+0x40e0/0x4d10 [mds]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff800774ed&amp;gt;] smp_send_reschedule+0x4e/0x53
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8008ddcd&amp;gt;] enqueue_task+0x41/0x56
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8897fd55&amp;gt;] lustre_msg_get_conn_cnt+0x35/0xf0 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff889896d9&amp;gt;] ptlrpc_server_handle_request+0x989/0xe00 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88989e35&amp;gt;] ptlrpc_wait_event+0x2e5/0x310 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8008c85d&amp;gt;] __wake_up_common+0x3e/0x68
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8898adc6&amp;gt;] ptlrpc_main+0xf66/0x1120 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8005dfb1&amp;gt;] child_rip+0xa/0x11
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff88989e60&amp;gt;] ptlrpc_main+0x0/0x1120 [ptlrpc]
Apr 23 15:58:34 ALPL505 kernel:  [&amp;lt;ffffffff8005dfa7&amp;gt;] child_rip+0x0/0x11
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This might be related to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-59&quot; title=&quot;call traces on MDS for ldlm_expired_completion_wait()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-59&quot;&gt;&lt;del&gt;LU-59&lt;/del&gt;&lt;/a&gt;, but please review this.&lt;/p&gt;</description>
                <environment></environment>
        <key id="14384">LU-1395</key>
            <summary>MDS hangs after calltrace at ldlm_expired_completion_wait()</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="green">Oleg Drokin</assignee>
                                    <reporter username="ihara">Shuichi Ihara</reporter>
                        <labels>
                    </labels>
                <created>Thu, 10 May 2012 11:42:13 +0000</created>
                <updated>Mon, 29 May 2017 04:00:53 +0000</updated>
                            <resolved>Mon, 29 May 2017 04:00:53 +0000</resolved>
                                    <version>Lustre 1.8.6</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="38551" author="pjones" created="Thu, 10 May 2012 13:13:46 +0000"  >&lt;p&gt;Oleg will look into this one&lt;/p&gt;</comment>
                            <comment id="42183" author="ihara" created="Tue, 24 Jul 2012 04:04:41 +0000"  >&lt;p&gt;Hi Peter, Oleg, &lt;br/&gt;
could you please take a look at this quickly? We saw similar problems at a couple of sites.&lt;/p&gt;</comment>
                            <comment id="42191" author="green" created="Tue, 24 Jul 2012 10:14:47 +0000"  >&lt;p&gt;This trace is just a sign of client not responding to lock cancel request. It should be followed by a client being evicted.&lt;br/&gt;
We need the client log to see what was happening there, I guess.&lt;/p&gt;</comment>
                            <comment id="46769" author="kitwestneat" created="Fri, 19 Oct 2012 05:42:18 +0000"  >&lt;p&gt;This looks like a dupe of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-500&quot; title=&quot;MDS threads hang ldlm_expired_completion_wait+&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-500&quot;&gt;&lt;del&gt;LU-500&lt;/del&gt;&lt;/a&gt; and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1269&quot; title=&quot;speed up ASTs sending&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1269&quot;&gt;&lt;del&gt;LU-1269&lt;/del&gt;&lt;/a&gt;. I think because &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1269&quot; title=&quot;speed up ASTs sending&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1269&quot;&gt;&lt;del&gt;LU-1269&lt;/del&gt;&lt;/a&gt; is marked as an improvement instead of bug, it hasn&apos;t been getting the attention it should be. It appears as if there are several different ideas for fixing the issue. Can someone take a look at it? We have been hitting this bug regularly, most recently at IU.&lt;/p&gt;</comment>
                            <comment id="197381" author="adilger" created="Mon, 29 May 2017 04:00:53 +0000"  >&lt;p&gt;Close old ticket.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="11340" name="mds_hang.tar.gz" size="222683" author="ihara" created="Thu, 10 May 2012 11:42:13 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10490" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>End date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Fri, 19 Oct 2012 11:42:13 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw1m7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10343</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10493" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>Start date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Thu, 10 May 2012 11:42:13 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    </customfields>
    </item>
</channel>
</rss>