<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:38:49 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10859] Deadlock with heavy memory pressure</title>
                <link>https://jira.whamcloud.com/browse/LU-10859</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;
On one Customer site, we hit following deadlock:

&#160; &#160; Thread 1:

&#160; &#160; ofd_object_punch

&#160;&#160; &#160; osd_punch

&#160; &#160; &#160; ldiskfs_truncate

&#160;&#160; &#160; &#160; ldiskfs_inode_attach_jinode

&#160;&#160; &#160; &#160; &#160; ...

&#160;&#160; &#160; &#160; &#160; do_try_to_free_pages

&#160; &#160; &#160; &#160; &#160; lu_cache_shrink

&#160;&#160; &#160; &#160; &#160; &#160; mutex_lock --&amp;gt;try to hold @lu_sites_guard

&#160;&#160; &#160;

&#160; &#160; kswapd thread2:

&#160; &#160; kthread

&#160;&#160; &#160; shrink_slab

&#160; &#160; &#160; lu_cache_shrink

&#160; &#160; &#160; &#160; mutex_lock ----&amp;gt;hold already.

&#160;&#160; &#160; &#160; &#160; ...

&#160;&#160; &#160; &#160; &#160; dqget

&#160; &#160; &#160; &#160; &#160; ldiskfs_acquire_dquot

&#160;&#160; &#160; &#160; &#160; &#160; jbd2__journal_start--&amp;gt;blocked to wait for more credits.

&#160;&#160; &#160;

&#160; &#160; Thread3:

&#160; &#160; kthread

&#160;&#160; &#160; kjournald2

&#160; &#160; &#160; jbd2_journal_commit_transaction--&amp;gt;blocked to wait Thread2 finished,

&#160;&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; since Thread1 add a handle into transaction.

&#160;&#160; &#160;

&#160; &#160; So the deadlock happens because Thread1 waits for Thread2, Thread2 waits for Thread3,

&#160; &#160; but Thread3 waits for Thread1.

&#160;&#160; &#160;

&#160; &#160; This problem still exists even though we have switched @lu_sites_guard

&#160; &#160; into a read/write lock, since we hold the write lock in lu_cache_shrink().

&#160;&#160; &#160;

&#160; &#160; Fixed the problem by making ldiskfs_inode_attach_jinode() use

&#160; &#160; GFP_NOFS.

&#160;

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>RHEL7 Server&lt;br/&gt;
Lustre 2.7.x series</environment>
        <key id="51561">LU-10859</key>
            <summary>Deadlock with heavy memory pressure</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="wangshilong">Wang Shilong</assignee>
                                    <reporter username="wangshilong">Wang Shilong</reporter>
                        <labels>
                            <label>patch</label>
                    </labels>
                <created>Wed, 28 Mar 2018 01:42:21 +0000</created>
                <updated>Mon, 11 May 2020 17:56:04 +0000</updated>
                            <resolved>Mon, 9 Apr 2018 21:04:40 +0000</resolved>
                                                    <fixVersion>Lustre 2.12.0</fixVersion>
                    <fixVersion>Lustre 2.10.4</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>10</watches>
                                                                            <comments>
                            <comment id="224678" author="gerrit" created="Wed, 28 Mar 2018 01:43:58 +0000"  >&lt;p&gt;Wang Shilong (wshilong@ddn.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/31806&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/31806&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: fix deadlock with heavy preassure&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 475c42e60f16281b9fd5f928559e2f0a4a4b6952&lt;/p&gt;</comment>
                            <comment id="224680" author="pjones" created="Wed, 28 Mar 2018 01:50:58 +0000"  >&lt;p&gt;Thanks &lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=wangshilong&quot; class=&quot;user-hover&quot; rel=&quot;wangshilong&quot;&gt;wangshilong&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="224690" author="bfaccini" created="Wed, 28 Mar 2018 08:16:29 +0000"  >&lt;p&gt;yes, thanks to create both this public ticket and Gerrit change in my place ...&lt;/p&gt;</comment>
                            <comment id="224693" author="wangshilong" created="Wed, 28 Mar 2018 08:40:00 +0000"  >&lt;p&gt;Hi Bruno, sorry for that, we are a bit urgent for this issue.&lt;/p&gt;</comment>
                            <comment id="224696" author="adilger" created="Wed, 28 Mar 2018 09:21:52 +0000"  >&lt;p&gt;Bob, can you please add a follow-on patch for SLES, either using the same patch (if it applies cleanly) or new patches as needed, once this initial patch has passed review &amp;amp; testing. &lt;/p&gt;</comment>
                            <comment id="224698" author="wangshilong" created="Wed, 28 Mar 2018 09:46:01 +0000"  >&lt;p&gt;Yup, Andreas, I should included SLES updates too, but it looks a bit hard for me to grab source codes for it, Ihara also reminded we need patch for&#160;ubuntu14+16 for master too.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="224705" author="pjones" created="Wed, 28 Mar 2018 12:35:40 +0000"  >&lt;p&gt;We only support ubuntu16 on master - not ubuntu14&lt;/p&gt;</comment>
                            <comment id="224713" author="chunteraa" created="Wed, 28 Mar 2018 13:51:24 +0000"  >&lt;p&gt;Is this related to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9728&quot; title=&quot;out of memory on OSS causing allocation failures or hung threads&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9728&quot;&gt;&lt;del&gt;LU-9728&lt;/del&gt;&lt;/a&gt; ?&lt;/p&gt;</comment>
                            <comment id="224717" author="wangshilong" created="Wed, 28 Mar 2018 14:25:38 +0000"  >&lt;p&gt;Hello Chris,&lt;/p&gt;

&lt;p&gt;&#160; our ES3 have already included that patch, but still hit the problem, so it is different.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="224806" author="chunteraa" created="Thu, 29 Mar 2018 16:19:41 +0000"  >&lt;p&gt;patch &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9728&quot; title=&quot;out of memory on OSS causing allocation failures or hung threads&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9728&quot;&gt;&lt;del&gt;LU-9728&lt;/del&gt;&lt;/a&gt; uses GFP_HIGHUSER for allocations instead of GFP_NOFS&lt;/p&gt;

&lt;p&gt;kernel_patch filename is &quot;GPF_NOFS&quot; but alloc flag is GFP_NOFS&lt;br/&gt;
 &lt;a href=&quot;https://www.kernel.org/doc/gorman/html/understand/understand009.html&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://www.kernel.org/doc/gorman/html/understand/understand009.html&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="224812" author="gerrit" created="Thu, 29 Mar 2018 17:11:36 +0000"  >&lt;p&gt;Bob Glossman (bob.glossman@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/31825&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/31825&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: extend previous fix to SLES&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: c4956f2dff93c428b3040c1e03d08c14ec6232c8&lt;/p&gt;</comment>
                            <comment id="224814" author="bogl" created="Thu, 29 Mar 2018 17:16:35 +0000"  >&lt;blockquote&gt;
&lt;p&gt;Bob, can you please add a follow-on patch for SLES, either using the same patch (if it applies cleanly) or new patches as needed, once this initial patch has passed review &amp;amp; testing.&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;done&lt;/p&gt;</comment>
                            <comment id="224851" author="wangshilong" created="Fri, 30 Mar 2018 01:40:45 +0000"  >&lt;p&gt;Hello&#160;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=chunteraa&quot; class=&quot;user-hover&quot; rel=&quot;chunteraa&quot;&gt;chunteraa&lt;/a&gt;&#160;,&lt;/p&gt;

&lt;p&gt;Thanks for reminding, I refreshed the patch to fix that.&lt;/p&gt;</comment>
                            <comment id="225512" author="gerrit" created="Mon, 9 Apr 2018 19:51:37 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/31806/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/31806/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: fix deadlock with heavy memory preassure&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 0506e1bd6a6d5fafe7fc5e558aa1b75e456c2642&lt;/p&gt;</comment>
                            <comment id="225555" author="pjones" created="Mon, 9 Apr 2018 21:04:40 +0000"  >&lt;p&gt;&lt;font color=&quot;#000000&quot;&gt;Landed for 2.12&lt;/font&gt;&lt;/p&gt;</comment>
                            <comment id="226119" author="wangshilong" created="Tue, 17 Apr 2018 00:45:57 +0000"  >&lt;p&gt;FYI, we&apos;d better include this fix into b2_10 LTS branch.&lt;/p&gt;</comment>
                            <comment id="226282" author="gerrit" created="Wed, 18 Apr 2018 20:48:38 +0000"  >&lt;p&gt;Minh Diep (minh.diep@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/32058&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32058&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: fix deadlock with heavy memory preassure&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_10&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: c5a9c83471aa5b6e0a593b7b99760e86c8311bee&lt;/p&gt;</comment>
                            <comment id="227255" author="gerrit" created="Thu, 3 May 2018 20:00:37 +0000"  >&lt;p&gt;John L. Hammond (john.hammond@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/32058/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32058/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: fix deadlock with heavy memory preassure&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_10&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 0595d92ad03ab9d975d599aad204d746aff991b3&lt;/p&gt;</comment>
                            <comment id="228916" author="hornc" created="Thu, 31 May 2018 15:01:19 +0000"  >&lt;p&gt;&lt;del&gt;&lt;blockquote&gt;&lt;p&gt;Bob Glossman (bob.glossman@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/31825&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/31825&lt;/a&gt;&lt;br/&gt;
 Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10859&quot; title=&quot;Deadlock with heavy memory pressure&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10859&quot;&gt;&lt;del&gt;LU-10859&lt;/del&gt;&lt;/a&gt; ldiskfs: extend previous fix to SLES&lt;br/&gt;
 Project: fs/lustre-release&lt;br/&gt;
 Branch: master&lt;br/&gt;
 Current Patch Set: 1&lt;br/&gt;
 Commit: c4956f2dff93c428b3040c1e03d08c14ec6232c8&lt;/p&gt;&lt;/blockquote&gt;&lt;/del&gt;&lt;br/&gt;
&#160;&lt;/p&gt;

&lt;p&gt;&lt;del&gt;This patch was abandoned but its changes were never rolled into the primary patch for this ticket ( &lt;a href=&quot;https://review.whamcloud.com/31806/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/31806/&lt;/a&gt;). Should Bob&apos;s patch be revived?&lt;/del&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;Edit: Nevermind, I misread the patches&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzuvz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>