<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:50:35 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-5333] rm cause MDS to complain hung tasks and disconnecting clients</title>
                <link>https://jira.whamcloud.com/browse/LU-5333</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;A client was running &quot;rm&quot; to remove a couple of million files when MDS system load shot to 30 and kernel trace dumping complaining hung tasks - See attached output from &quot;dmesg&quot;&lt;/p&gt;

&lt;p&gt;I would think this is normal workload for a duo-westmere CPU / 24GB RAM bonded myricom 10Gbps system.&lt;/p&gt;

&lt;p&gt;We have been seeing happening more frequently in 2.4.3 than when we were at 1.8.7.&lt;/p&gt;

&lt;p&gt;Anything suggestion?&lt;/p&gt;

&lt;p&gt;thanks,&lt;br/&gt;
Haisong&lt;/p&gt;</description>
                <environment>Linux puma-mds-10-6.local 2.6.32-358.23.2.el6_lustre.x86_64 #1 SMP Thu Dec 19 19:57:45 PST 2013 x86_64 x86_64 x86_64 GNU/Linux&lt;br/&gt;
</environment>
        <key id="25546">LU-5333</key>
            <summary>rm cause MDS to complain hung tasks and disconnecting clients</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="niu">Niu Yawei</assignee>
                                    <reporter username="haisong">Haisong Cai</reporter>
                        <labels>
                            <label>sdsc</label>
                    </labels>
                <created>Fri, 11 Jul 2014 20:10:57 +0000</created>
                <updated>Wed, 22 Jun 2016 08:55:39 +0000</updated>
                            <resolved>Wed, 22 Jun 2016 08:55:39 +0000</resolved>
                                    <version>Lustre 2.4.3</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="88900" author="pjones" created="Sat, 12 Jul 2014 13:36:59 +0000"  >&lt;p&gt;Niu&lt;/p&gt;

&lt;p&gt;Could you please advise on this issue?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="88951" author="green" created="Mon, 14 Jul 2014 17:09:31 +0000"  >&lt;p&gt;From the traces it looks like it&apos;s a combination of OOM and journal deadlock of some sort.&lt;/p&gt;</comment>
                            <comment id="89045" author="haisong" created="Tue, 15 Jul 2014 16:13:45 +0000"  >&lt;p&gt;Hi Oleg,&lt;/p&gt;

&lt;p&gt;Later that day, the MDS came to a point where local commands were hanging. &lt;br/&gt;
We rebooted the server and ran e2fsck. That fixed a bunch quota entries and couple of inodes.&lt;/p&gt;

&lt;p&gt;It has been stable so far.&lt;/p&gt;

&lt;p&gt;Haisong&lt;/p&gt;</comment>
                            <comment id="96762" author="haisong" created="Mon, 20 Oct 2014 22:26:37 +0000"  >&lt;p&gt;We have another case where removing some several million files from filesystem caused MDS to dump stack traces and gradually hang. I will attache some stack traces and dmesg following this message. &lt;/p&gt;</comment>
                            <comment id="96764" author="haisong" created="Mon, 20 Oct 2014 22:30:26 +0000"  >&lt;p&gt;Correction: server is running 2.4.2 not 2.4.3&lt;/p&gt;</comment>
                            <comment id="97532" author="niu" created="Mon, 27 Oct 2014 09:14:05 +0000"  >&lt;p&gt;I think this could be related with &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5726&quot; title=&quot;MDS buffer not freed when deleting files&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5726&quot;&gt;&lt;del&gt;LU-5726&lt;/del&gt;&lt;/a&gt;, and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5503&quot; title=&quot;MDS (2.4.2) are getting &amp;quot;Service thread ... inactive&amp;quot; and file-system times out&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5503&quot;&gt;&lt;del&gt;LU-5503&lt;/del&gt;&lt;/a&gt; looks another instance of such problem.&lt;/p&gt;</comment>
                            <comment id="97708" author="haisong" created="Tue, 28 Oct 2014 16:14:07 +0000"  >&lt;p&gt;Hi Yawei,&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5726&quot; title=&quot;MDS buffer not freed when deleting files&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5726&quot;&gt;&lt;del&gt;LU-5726&lt;/del&gt;&lt;/a&gt; indicates the issue is fixed in 2.7.0. &lt;br/&gt;
Could you comment on whether the fix can be back-ported into earlier versions, specifically 2.5.*?&lt;/p&gt;

&lt;p&gt;thanks,&lt;br/&gt;
Haisong&lt;/p&gt;</comment>
                            <comment id="97709" author="pjones" created="Tue, 28 Oct 2014 16:33:28 +0000"  >&lt;p&gt;Haisong&lt;/p&gt;

&lt;p&gt;To be clear &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5726&quot; title=&quot;MDS buffer not freed when deleting files&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5726&quot;&gt;&lt;del&gt;LU-5726&lt;/del&gt;&lt;/a&gt; is targeted to be fixed in the 2.7 release but is not fixed yet. Your interest in this issue will raise the priority on this work and Niu will look at the possibilities/options to backport a fix to 2.5.x as part of this effort.&lt;/p&gt;

&lt;p&gt;Regards&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="105987" author="niu" created="Fri, 6 Feb 2015 02:30:47 +0000"  >&lt;p&gt;b2_5 port: &lt;a href=&quot;http://review.whamcloud.com/#/c/13464/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/13464/&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="26970">LU-5726</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="26061">LU-5503</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="16016" name="dmesg.3369" size="460854" author="haisong" created="Mon, 20 Oct 2014 22:29:44 +0000"/>
                            <attachment id="15370" name="dmesg_log" size="57807" author="haisong" created="Fri, 11 Jul 2014 20:10:57 +0000"/>
                            <attachment id="16017" name="lustre-log.tgz" size="1725308" author="haisong" created="Mon, 20 Oct 2014 22:29:44 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10490" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>End date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Fri, 6 Feb 2015 20:10:57 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwr8v:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>14881</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10021"><![CDATA[2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10493" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>Start date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Fri, 11 Jul 2014 20:10:57 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    </customfields>
    </item>
</channel>
</rss>