<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:32:29 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10149] sanityn test_23: timeout after test_18 mmap_sanity takes thousands of seconds</title>
                <link>https://jira.whamcloud.com/browse/LU-10149</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for jianyu &amp;lt;jian.yu@intel.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/99cbc9cc-b407-11e7-9eee-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/99cbc9cc-b407-11e7-9eee-5254006e85c2&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_23 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Timeout occurred after 151 mins, last suite running was sanityn, restarting cluster to continue tests
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Please provide additional information about the failure here.&lt;/p&gt;

&lt;p&gt;Info required for matching: sanityn 23&lt;/p&gt;</description>
                <environment></environment>
        <key id="48877">LU-10149</key>
            <summary>sanityn test_23: timeout after test_18 mmap_sanity takes thousands of seconds</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="bfaccini">Bruno Faccini</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Mon, 23 Oct 2017 07:28:20 +0000</created>
                <updated>Fri, 26 Jan 2018 20:15:54 +0000</updated>
                            <resolved>Fri, 26 Jan 2018 20:15:54 +0000</resolved>
                                    <version>Lustre 2.11.0</version>
                                    <fixVersion>Lustre 2.11.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="211644" author="yujian" created="Mon, 23 Oct 2017 07:30:22 +0000"  >&lt;p&gt;Another failure instance on master branch:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3c3a6f64-b58f-11e7-8afb-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3c3a6f64-b58f-11e7-8afb-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="211705" author="gerrit" created="Mon, 23 Oct 2017 17:06:56 +0000"  >&lt;p&gt;Faccini Bruno (bruno.faccini@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/29715&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/29715&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10149&quot; title=&quot;sanityn test_23: timeout after test_18 mmap_sanity takes thousands of seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10149&quot;&gt;&lt;del&gt;LU-10149&lt;/del&gt;&lt;/a&gt; tests: avoid live-lock with concurrent memsets&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 6679ad023c6c63bb9495eed570e8dd9ad06f3e9a&lt;/p&gt;</comment>
                            <comment id="211707" author="bfaccini" created="Mon, 23 Oct 2017 17:09:38 +0000"  >&lt;p&gt;Change #29715 is an attempt to split and delay concurrent memsets to reduce the execution time of auto-tests using mmap_sanity, due to some possible live-lock situation likely to occur.&lt;/p&gt;</comment>
                            <comment id="213174" author="adilger" created="Wed, 8 Nov 2017 20:53:01 +0000"  >&lt;p&gt;While this is a workaround for the test failures (which should land, don&apos;t get me wrong), it would be better to have some way to ensure that the client is at least making some forward progress when faulting in pages, so that applications using mmap don&apos;t fall over so badly.&lt;/p&gt;

&lt;p&gt;One option would be to use a delay mechanism in the DLM lock cancellation, so that mmap locks cannot be cancelled within, say, 10ms of being granted or last modified.  Secondly, in the two-node mmap case (and in other DLM lock ping-pong cases), we should look at reducing extent lock expansion (e.g. to 1MB) so that multiple writers are not causing needless lock contention.  That would allow one node to get some work done, and hopefully move out of the IO range of the other node so they can work independently.&lt;/p&gt;</comment>
                            <comment id="213207" author="bfaccini" created="Thu, 9 Nov 2017 10:53:58 +0000"  >&lt;p&gt;Andreas,&lt;br/&gt;
As per my heavy testing results, my current fix attempt (by splitting and delaying concurrent memsets) in change #29715 is not a 100% workaround.&lt;br/&gt;
Thus I was already trying to find a more definitive fix, and delaying DLM lock cancellation had also appeared to me to be a good way. I should push a new patch to implement this soon.&lt;br/&gt;
I will also investigate the extent lock expansion reduction that you have pointed out, thanks.&lt;/p&gt;

</comment>
                            <comment id="214368" author="yujian" created="Tue, 21 Nov 2017 19:50:12 +0000"  >&lt;p&gt;More failure instances on master branch:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/b059527a-ce17-11e7-9c63-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/b059527a-ce17-11e7-9c63-52540065bddc&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/6ddc3400-ce74-11e7-9c63-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/6ddc3400-ce74-11e7-9c63-52540065bddc&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/cae1c010-cbc3-11e7-a066-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/cae1c010-cbc3-11e7-a066-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="215909" author="gerrit" created="Mon, 11 Dec 2017 09:56:25 +0000"  >&lt;p&gt;Faccini Bruno (bruno.faccini@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/30465&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/30465&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10149&quot; title=&quot;sanityn test_23: timeout after test_18 mmap_sanity takes thousands of seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10149&quot;&gt;&lt;del&gt;LU-10149&lt;/del&gt;&lt;/a&gt; llite: avoid live-lock when concurrent mmap()s&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 783df45c6faf25c51add9d2965604599ead6f0d5&lt;/p&gt;</comment>
                            <comment id="215910" author="bfaccini" created="Mon, 11 Dec 2017 10:01:42 +0000"  >&lt;p&gt;Change #30465 is an attempt to fix in a more generic way the live-lock upon concurrent mmap()s situation.&lt;/p&gt;</comment>
                            <comment id="217050" author="gerrit" created="Fri, 22 Dec 2017 06:49:33 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/30465/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/30465/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10149&quot; title=&quot;sanityn test_23: timeout after test_18 mmap_sanity takes thousands of seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10149&quot;&gt;&lt;del&gt;LU-10149&lt;/del&gt;&lt;/a&gt; llite: avoid live-lock when concurrent mmap()s&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: cd793b4067b62862185f481cfef7b779927b801f&lt;/p&gt;</comment>
                            <comment id="218331" author="bfaccini" created="Tue, 16 Jan 2018 17:23:13 +0000"  >&lt;p&gt;Change #29715 has been abandoned in favor of more generic change #30465.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="49068">LU-10184</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="13530">LU-1205</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzmb3:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>