<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:23:31 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16046] Shared-file I/O performance is poor under group lock</title>
                <link>https://jira.whamcloud.com/browse/LU-16046</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9964&quot; title=&quot;&amp;gt; 1 group lock on same file (group lock lifecycle/cbpending problem)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9964&quot;&gt;&lt;del&gt;LU-9964&lt;/del&gt;&lt;/a&gt; fixed the crashes but made unlocks synchronous; as a result, group unlock may take dozens of seconds. Precisely, the test is N ranks opening (+O_CREAT) the same file, taking a group lock, writing 1MB segments for a total of 128GB (each rank writes 128GB/rank count) at a stride of (1MB*rank count), fsync() and group unlock. Timings are similar regardless of MPI barriers after each phase or no barriers.&lt;/p&gt;

&lt;p&gt;The ticket is to make group unlock asynchronous.&lt;/p&gt;</description>
                <environment></environment>
        <key id="71489">LU-16046</key>
            <summary>Shared-file I/O performance is poor under group lock</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="vitaly_fertman">Vitaly Fertman</assignee>
                                    <reporter username="vitaly_fertman">Vitaly Fertman</reporter>
                        <labels>
                    </labels>
                <created>Mon, 25 Jul 2022 15:10:31 +0000</created>
                <updated>Tue, 7 Mar 2023 16:30:10 +0000</updated>
                            <resolved>Mon, 14 Nov 2022 14:17:52 +0000</resolved>
                                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="341457" author="gerrit" created="Mon, 25 Jul 2022 15:21:37 +0000"  >&lt;p&gt;&quot;Vitaly Fertman &amp;lt;vitaly.fertman@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/48037&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48037&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; revert: &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9964&quot; title=&quot;&amp;gt; 1 group lock on same file (group lock lifecycle/cbpending problem)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9964&quot;&gt;&lt;del&gt;LU-9964&lt;/del&gt;&lt;/a&gt; llite: prevent mulitple group locks&quot;&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 0209c56134919eed6e81c006e3eb45e77656bab9&lt;/p&gt;</comment>
                            <comment id="341458" author="gerrit" created="Mon, 25 Jul 2022 15:21:38 +0000"  >&lt;p&gt;&quot;Vitaly Fertman &amp;lt;vitaly.fertman@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/48038&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48038&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; ldlm: group lock fix&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 74fd9699bb25e6e607b4c7401d05e69c27594e20&lt;/p&gt;</comment>
                            <comment id="349787" author="gerrit" created="Sat, 15 Oct 2022 05:58:31 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/48037/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/48037/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; revert: &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9964&quot; title=&quot;&amp;gt; 1 group lock on same file (group lock lifecycle/cbpending problem)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9964&quot;&gt;&lt;del&gt;LU-9964&lt;/del&gt;&lt;/a&gt; llite: prevent mulitple group locks&quot;&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: bc37f89a81ea0a2fae8668e21247552e8894bfd8&lt;/p&gt;</comment>
                            <comment id="349788" author="gerrit" created="Sat, 15 Oct 2022 05:58:42 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/48038/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/48038/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; ldlm: group lock fix&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 3ffcb5b700ebfd68dba4daca4192fdacaf7fd541&lt;/p&gt;</comment>
                            <comment id="349810" author="pjones" created="Sun, 16 Oct 2022 01:13:15 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                            <comment id="349858" author="bzzz" created="Mon, 17 Oct 2022 13:51:44 +0000"  >&lt;p&gt;bisection points to this patch.&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
[  106.147323] Lustre: DEBUG MARKER: == sanity test 184e: Recreate layout after stripeless layout swaps ========================================================== 13:37:47 (1666013867)
[  106.450660] BUG: sleeping function called from invalid context at kernel/locking/mutex.c:934
[  106.450907] in_atomic(): 1, irqs_disabled(): 0, pid: 9400, name: lfs
[  106.451024] INFO: lockdep is turned off.
[  106.451101] CPU: 0 PID: 9400 Comm: lfs Tainted: G        W  O     --------- -  - 4.18.0 #1
[  106.451235] Hardware name: Bochs Bochs, BIOS Bochs 01/01/2011
[  106.451346] Call Trace:
[  106.451403]  dump_stack+0x5c/0x80
[  106.451480]  ___might_sleep.cold.21+0x9b/0xa8
[  106.451550]  __mutex_lock+0x41/0x930
[  106.451628]  ? osc_grouplock_dec+0x28/0x1a0 [osc]
[  106.451717]  osc_grouplock_dec+0x28/0x1a0 [osc]
[  106.451805]  osc_object_ast_clear+0x1ba/0x370 [osc]
[  106.451882]  ? osc_attr_get+0x30/0x30 [osc]
[  106.451988]  ldlm_resource_foreach+0xcc/0x280 [ptlrpc]
[  106.452081]  ? osc_attr_get+0x30/0x30 [osc]
[  106.452175]  ldlm_resource_iterate+0x122/0x180 [ptlrpc]
[  106.452273]  osc_object_prune+0x50/0x90 [osc]
[  106.452377]  cl_object_prune+0x50/0x130 [obdclass]
[  106.452521]  lov_delete_composite+0xfc/0x490 [lov]
[  106.452611]  lov_conf_set+0x654/0xb10 [lov]
[  106.452695]  cl_conf_set+0x58/0x130 [obdclass]
[  106.452788]  ll_layout_conf+0x120/0x400 [lustre]
[  106.452872]  ? ll_layout_refresh+0x6e3/0x1440 [lustre]
[  106.452956]  ll_layout_refresh+0x6e3/0x1440 [lustre]
[  106.453039]  vvp_io_init+0x209/0x360 [lustre]
[  106.453135]  __cl_io_init.isra.2+0x7f/0x150 [obdclass]
[  106.453224]  cl_setattr_ost+0x19c/0x2f0 [lustre]
[  106.453308]  ll_setattr_raw+0x10a3/0x1340 [lustre]
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
COMMIT		TESTED	PASSED	FAILED		COMMIT DESCRIPTION
3ffcb5b700	4	3	1	BAD	LU-16046 ldlm: group lock fix
bc37f89a81	10	10	0	GOOD	LU-16046 revert: &lt;span class=&quot;code-quote&quot;&gt;&quot;LU-9964 llite: prevent mulitple group locks&quot;&lt;/span&gt;
59f0d69168	10	10	0	GOOD	LU-15721 llite: only statfs &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; projid &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; PROJINHERIT set
a41ee518f0	10	10	0	GOOD	LU-16219 tests: syntax error fix
e174717923	10	10	0	GOOD	LU-16198 tests: increase margin &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; sanity/33hh
af0ce0ca76	10	10	0	GOOD	LU-16200 tests: test_32[f,g]: specify blocksize explicitly
d3074511f3	10	10	0	GOOD	LU-16180 ptlrpc: reduce lock contention in ptlrpc_free_committed
f5ca6853b8	10	10	0	GOOD	LU-16076 utils: enhance &lt;span class=&quot;code-quote&quot;&gt;&apos;lfs check&apos;&lt;/span&gt; command
0bb491b2ec	10	10	0	GOOD	LU-16044 osd: discard pagecache in truncate&apos;s declaration
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="350900" author="vitaly_fertman" created="Wed, 26 Oct 2022 22:20:14 +0000"  >&lt;p&gt;Alex, a link to a failure please ?&lt;/p&gt;</comment>
                            <comment id="350949" author="bzzz" created="Thu, 27 Oct 2022 05:26:25 +0000"  >&lt;blockquote&gt;&lt;p&gt;Alex, a link to a failure please ?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;this is a local setup. AT doesn&apos;t hit this because AT&apos;s kernel has no debugging enabled (e.g. CONFIG_DEBUG_ATOMIC_SLEEP)&lt;/p&gt;</comment>
                            <comment id="352347" author="spitzcor" created="Wed, 9 Nov 2022 19:13:07 +0000"  >&lt;p&gt;&lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49008&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49008&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="352867" author="gerrit" created="Mon, 14 Nov 2022 08:26:40 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49008/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49008/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; ldlm: group lock unlock fix&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 3dc261c06434eceee3ba9ef86d1f376954b2d234&lt;/p&gt;</comment>
                            <comment id="352903" author="pjones" created="Mon, 14 Nov 2022 14:17:52 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                            <comment id="364852" author="gerrit" created="Fri, 3 Mar 2023 17:14:53 +0000"  >&lt;p&gt;&quot;Etienne AUJAMES &amp;lt;eaujames@ddn.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50201&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50201&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; ldlm: group lock unlock fix&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 3aed6087019b12bbaaeeaa0fdec37650242ee41b&lt;/p&gt;</comment>
                            <comment id="365091" author="gerrit" created="Tue, 7 Mar 2023 16:30:10 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50226&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50226&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16046&quot; title=&quot;Shared-file I/O performance is poor under group lock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16046&quot;&gt;&lt;del&gt;LU-16046&lt;/del&gt;&lt;/a&gt; ldlm: group lock unlock fix&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 200a29391b5d78ef964e958ed5f6dd19e322f2f0&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="48242">LU-9964</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02vfb:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>