<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:18:13 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-15427] Lustre client hangs under memory pressure</title>
                <link>https://jira.whamcloud.com/browse/LU-15427</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Our compute nodes have 384GB memory and 192GB swap space. When applications use a lot of memory (all of the 384GB and some of the 192GB swap), many processes reading/writing to Lustre enter D state, hang, and never recover. We see the following in syslog. Note: swap never gets full.&#160;&lt;/p&gt;

&lt;p&gt;Jan &#160;3 18:26:03 spool0121 kernel: INFO: task kswapd0:510 blocked for more than 120 seconds.&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot; disables this message.&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: kswapd0 &#160; &#160; &#160; &#160; D ffffa0f83caf85e0 &#160; &#160; 0 &#160; 510 &#160; &#160; &#160;2 0x00000000&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: Call Trace:&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3387480&amp;gt;&amp;#93;&lt;/span&gt; ? bit_wait+0x50/0x50&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3389179&amp;gt;&amp;#93;&lt;/span&gt; schedule+0x29/0x70&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3386e41&amp;gt;&amp;#93;&lt;/span&gt; schedule_timeout+0x221/0x2d0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc152111c&amp;gt;&amp;#93;&lt;/span&gt; ? cl_io_slice_add+0x5c/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2d06992&amp;gt;&amp;#93;&lt;/span&gt; ? ktime_get_ts64+0x52/0xf0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3387480&amp;gt;&amp;#93;&lt;/span&gt; ? bit_wait+0x50/0x50&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3388a2d&amp;gt;&amp;#93;&lt;/span&gt; io_schedule_timeout+0xad/0x130&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3388ac8&amp;gt;&amp;#93;&lt;/span&gt; io_schedule+0x18/0x20&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3387491&amp;gt;&amp;#93;&lt;/span&gt; bit_wait_io+0x11/0x50&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3386fb7&amp;gt;&amp;#93;&lt;/span&gt; __wait_on_bit+0x67/0x90&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dbd3c1&amp;gt;&amp;#93;&lt;/span&gt; wait_on_page_bit+0x81/0xa0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cc7010&amp;gt;&amp;#93;&lt;/span&gt; ? wake_bit_function+0x40/0x40&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd380b&amp;gt;&amp;#93;&lt;/span&gt; shrink_page_list+0x9eb/0xc30&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd2853&amp;gt;&amp;#93;&lt;/span&gt; ? isolate_lru_pages.isra.47+0xd3/0x190&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd4066&amp;gt;&amp;#93;&lt;/span&gt; shrink_inactive_list+0x1b6/0x5c0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dcd77e&amp;gt;&amp;#93;&lt;/span&gt; ? release_pages+0x24e/0x430&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd4b45&amp;gt;&amp;#93;&lt;/span&gt; shrink_lruvec+0x375/0x730&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cd2c60&amp;gt;&amp;#93;&lt;/span&gt; ? task_rq_unlock+0x20/0x20&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd5d36&amp;gt;&amp;#93;&lt;/span&gt; mem_cgroup_shrink_node_zone+0xa6/0x170&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2e428c3&amp;gt;&amp;#93;&lt;/span&gt; mem_cgroup_soft_limit_reclaim+0x1e3/0x4b0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd60e0&amp;gt;&amp;#93;&lt;/span&gt; balance_pgdat+0x2e0/0x5e0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd6553&amp;gt;&amp;#93;&lt;/span&gt; kswapd+0x173/0x430&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cc6f50&amp;gt;&amp;#93;&lt;/span&gt; ? wake_up_atomic_t+0x30/0x30&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2dd63e0&amp;gt;&amp;#93;&lt;/span&gt; ? balance_pgdat+0x5e0/0x5e0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cc5e61&amp;gt;&amp;#93;&lt;/span&gt; kthread+0xd1/0xe0&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cc5d90&amp;gt;&amp;#93;&lt;/span&gt; ? insert_kthread_work+0x40/0x40&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa3395ddd&amp;gt;&amp;#93;&lt;/span&gt; ret_from_fork_nospec_begin+0x7/0x21&lt;br/&gt;
Jan &#160;3 18:26:03 spool0121 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa2cc5d90&amp;gt;&amp;#93;&lt;/span&gt; ? insert_kthread_work+0x40/0x40&lt;/p&gt;</description>
                <environment>RHEL 7 - Kernel 3.10.0-1160.42.2.el7.x86_64</environment>
        <key id="67887">LU-15427</key>
            <summary>Lustre client hangs under memory pressure</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="raot">Joe Frith</reporter>
                        <labels>
                    </labels>
                <created>Mon, 10 Jan 2022 16:17:10 +0000</created>
                <updated>Mon, 10 Jan 2022 16:17:10 +0000</updated>
                                            <version>Lustre 2.12.8</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                    <customfield id="customfield_10030" key="com.atlassian.jira.plugin.system.customfieldtypes:labels">
                        <customfieldname>Epic/Theme</customfieldname>
                        <customfieldvalues>
                                        <label>patch</label>
    
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02e5z:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10021"><![CDATA[2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>