<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:13:23 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1087] mdt thread spinning out of control</title>
                <link>https://jira.whamcloud.com/browse/LU-1087</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;On one of our filesystems that was upgraded to lustre 2.1 last week, the MDS has one thread that appears to be stuck spinning:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;13711 root      20   0     0    0    0 R 99.9  0.0   6289:28 mdt_253
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Using sysrq (since crash can&apos;t trace a live process):&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;2012-02-09 16:18:39 Call Trace:
2012-02-09 16:18:39  [&amp;lt;ffffffffa06de440&amp;gt;] ? ldlm_cancel_locks_for_export_cb+0x0/0xd0 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa06de440&amp;gt;] ? ldlm_cancel_locks_for_export_cb+0x0/0xd0 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0498f46&amp;gt;] cfs_hash_for_each_empty+0xc6/0x170 [libcfs]
2012-02-09 16:18:39  [&amp;lt;ffffffffa06db15f&amp;gt;] ldlm_cancel_locks_for_export+0x1f/0x30 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa06e7c94&amp;gt;] server_disconnect_export+0x64/0x170 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0c50dcb&amp;gt;] mdt_obd_disconnect+0x4b/0xd50 [mdt]
2012-02-09 16:18:39  [&amp;lt;ffffffffa071681e&amp;gt;] ? lustre_pack_reply_flags+0xae/0x1b0 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0716931&amp;gt;] ? lustre_pack_reply+0x11/0x20 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa06e4d4a&amp;gt;] target_handle_disconnect+0x16a/0x3a0 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0c4a805&amp;gt;] mdt_disconnect+0x35/0x100 [mdt]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0c4674d&amp;gt;] mdt_handle_common+0x73d/0x12b0 [mdt]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0717334&amp;gt;] ? lustre_msg_get_transno+0x54/0x90 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0c47395&amp;gt;] mdt_regular_handle+0x15/0x20 [mdt]
2012-02-09 16:18:39  [&amp;lt;ffffffffa0723181&amp;gt;] ptlrpc_main+0xcd1/0x1690 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa07224b0&amp;gt;] ? ptlrpc_main+0x0/0x1690 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffff8100c14a&amp;gt;] child_rip+0xa/0x20
2012-02-09 16:18:39  [&amp;lt;ffffffffa07224b0&amp;gt;] ? ptlrpc_main+0x0/0x1690 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffffa07224b0&amp;gt;] ? ptlrpc_main+0x0/0x1690 [ptlrpc]
2012-02-09 16:18:39  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>lustre 2.1.0-21chaos (github.com/chaos/lustre)</environment>
        <key id="13146">LU-1087</key>
            <summary>mdt thread spinning out of control</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="morrone">Christopher Morrone</reporter>
                        <labels>
                    </labels>
                <created>Thu, 9 Feb 2012 19:31:43 +0000</created>
                <updated>Fri, 13 Jul 2012 15:11:22 +0000</updated>
                            <resolved>Tue, 5 Jun 2012 06:04:06 +0000</resolved>
                                    <version>Lustre 2.1.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="28322" author="morrone" created="Thu, 9 Feb 2012 20:09:11 +0000"  >&lt;p&gt;Excerpt from the log for the spinning thread, showing it repeatedly trying to free the same hash:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00010000:00000040:15.0:1328835885.126894:0:13711:0:(ldlm_resource.c:1102:ldlm_resource_getref()) getref res: ffff88082dc5fa80 count: 2
00010000:00000040:15.0:1328835885.126895:0:13711:0:(ldlm_resource.c:1141:ldlm_resource_putref()) putref res: ffff88082dc5fa80 count: 1
00000001:00000040:15.0:1328835885.126925:0:13711:0:(hash.c:1687:cfs_hash_for_each_empty()) Try to empty hash: 60009e44-9f98-9, loop: 178108
00010000:00000040:15.0:1328835885.126957:0:13711:0:(ldlm_resource.c:1102:ldlm_resource_getref()) getref res: ffff88082dc5fa80 count: 2
00010000:00000040:15.0:1328835885.126958:0:13711:0:(ldlm_resource.c:1141:ldlm_resource_putref()) putref res: ffff88082dc5fa80 count: 1
00000001:00000040:15.0:1328835885.126988:0:13711:0:(hash.c:1687:cfs_hash_for_each_empty()) Try to empty hash: 60009e44-9f98-9, loop: 178109
00010000:00000040:15.0:1328835885.127020:0:13711:0:(ldlm_resource.c:1102:ldlm_resource_getref()) getref res: ffff88082dc5fa80 count: 2
00010000:00000040:15.0:1328835885.127022:0:13711:0:(ldlm_resource.c:1141:ldlm_resource_putref()) putref res: ffff88082dc5fa80 count: 1
00000001:00000040:15.0:1328835885.127051:0:13711:0:(hash.c:1687:cfs_hash_for_each_empty()) Try to empty hash: 60009e44-9f98-9, loop: 178110
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="28330" author="pjones" created="Thu, 9 Feb 2012 22:19:20 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="28360" author="laisiyao" created="Fri, 10 Feb 2012 11:59:17 +0000"  >&lt;p&gt;Hi Chris, did you see any error messages about ldlm lock before this happened?&lt;/p&gt;</comment>
                            <comment id="28371" author="morrone" created="Fri, 10 Feb 2012 14:04:51 +0000"  >&lt;p&gt;We saw all manner of timeouts, and reconnects, slow service warnings and just generally a lot of log traffic.  There are certainly lock callback timer expirations and other ldlm stuff happening in there.&lt;/p&gt;</comment>
                            <comment id="28862" author="laisiyao" created="Thu, 16 Feb 2012 03:44:03 +0000"  >&lt;p&gt;Chris, your log shows you&apos;ve enabled D_INFO logging; could you enable D_DLMTRACE and check which lock is in the dead loop (ldlm_cancel_locks_for_export_cb() should print lock information)?&lt;/p&gt;</comment>
                            <comment id="28992" author="morrone" created="Thu, 16 Feb 2012 13:02:13 +0000"  >&lt;p&gt;If it happens again I will do that.  Unfortunately D_INFO caused &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1088&quot; title=&quot;mgs threads go nuts&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1088&quot;&gt;&lt;del&gt;LU-1088&lt;/del&gt;&lt;/a&gt;, so I was not able to get any further debugging information.&lt;/p&gt;</comment>
                            <comment id="40005" author="liang" created="Tue, 5 Jun 2012 05:31:56 +0000"  >&lt;p&gt;I&apos;ve posted a patch for review: &lt;a href=&quot;http://review.whamcloud.com/#change,3028&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,3028&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="40009" author="pjones" created="Tue, 5 Jun 2012 06:04:06 +0000"  >&lt;p&gt;This is believed to be a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1428&quot; title=&quot;MDT servrice threads spinning in cfs_hash_for_each_relax()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1428&quot;&gt;&lt;del&gt;LU-1428&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="14508">LU-1428</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvhdr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6465</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10021"><![CDATA[2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>