<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:33:05 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-17154] parallel-scale-nfsv4: hangs on umount after racer_on_nfs</title>
                <link>https://jira.whamcloud.com/browse/LU-17154</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for jianyu &amp;lt;yujian@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/568e0c21-9347-476a-beac-081e9b2ee112&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/568e0c21-9347-476a-beac-081e9b2ee112&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Test session details:&lt;br/&gt;
clients: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-master/4468&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-master/4468&lt;/a&gt; - 5.14.0-284.25.1.el9_2.x86_64&lt;br/&gt;
servers: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-master/4468&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-master/4468&lt;/a&gt; - 5.14.0-284.25.1_lustre.el9.x86_64&lt;/p&gt;

&lt;p&gt;&amp;lt;&amp;lt;Please provide additional information about the failure here&amp;gt;&amp;gt;&lt;/p&gt;

&lt;p&gt;parallel-scale-nfsv4 hangs on:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Stopping client trevis-27vm4 /mnt/lustre (opts:-f)
CMD: trevis-27vm4 lsof -t /mnt/lustre
pdsh@trevis-27vm1: trevis-27vm4: ssh exited with exit code 1
CMD: trevis-27vm4 umount -f /mnt/lustre 2&amp;gt;&amp;amp;1
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Console log on trevis-27vm4:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[70712.060132] Lustre: DEBUG MARKER: umount -f /mnt/lustre 2&amp;gt;&amp;amp;1
[70712.213680] Lustre: setting import lustre-MDT0000_UUID INACTIVE by administrator request
[70712.215066] LustreError: 2067684:0:(file.c:245:ll_close_inode_openhandle()) lustre-clilmv-ffffa03d96d7f000: inode [0x200000bd3:0x2c31:0x0] mdc close failed: rc = -108
[70712.243116] Lustre: 1411383:0:(llite_lib.c:3965:ll_dirty_page_discard_warn()) lustre: dirty page discard: 10.240.38.143@tcp:/lustre/fid: [0x28000040a:0x3699:0x0]/ may get corrupted (rc -108)
[70712.243167] Lustre: 1411382:0:(llite_lib.c:3965:ll_dirty_page_discard_warn()) lustre: dirty page discard: 10.240.38.143@tcp:/lustre/fid: [0x2c000040a:0x3318:0x0]/ may get corrupted (rc -108)
&amp;lt;~snip~&amp;gt;
[70742.217783] Lustre: lustre-MDT0000: haven&apos;t heard from client 0e545e12-9ad6-4857-a78b-e65f011477b4 (at 0@lo) in 31 seconds. I think it&apos;s dead, and I am evicting it. exp 00000000320f809c, cur 1695838270 expire 1695838240 last 1695838239
[70745.262062] Lustre: lustre-MDT0002: haven&apos;t heard from client 0e545e12-9ad6-4857-a78b-e65f011477b4 (at 0@lo) in 34 seconds. I think it&apos;s dead, and I am evicting it. exp 00000000887f97a0, cur 1695838273 expire 1695838243 last 1695838239
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="78167">LU-17154</key>
            <summary>parallel-scale-nfsv4: hangs on umount after racer_on_nfs</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="Deiter">Alex Deiter</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Thu, 28 Sep 2023 04:26:44 +0000</created>
                <updated>Thu, 25 Jan 2024 08:36:57 +0000</updated>
                                            <version>Lustre 2.16.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="387936" author="adilger" created="Tue, 3 Oct 2023 04:48:31 +0000"  >&lt;p&gt;It looks like parallel-scale-nfsv4 is failing to unmount cleanly when racer is run, and unmounted properly when racer_on_nfs is skipped. I haven&apos;t checked why racer is skipped, but I wonder if it should always be skipped?  Otherwise, it makes all of the NFS testing unreliable?  &lt;/p&gt;

&lt;p&gt;It does appear that there are some cases where racer_on_nfs is run AND the test unmounts properly, but unfortunately it is difficult to search for this in Maloo easily. &lt;/p&gt;
</comment>
                            <comment id="387937" author="adilger" created="Tue, 3 Oct 2023 05:01:40 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=Deiter&quot; class=&quot;user-hover&quot; rel=&quot;Deiter&quot;&gt;Deiter&lt;/a&gt;, could you please submit a patch to master and b_es6_0 to add racer_on_nfs to the always_except list. It looks like the &lt;tt&gt;parallel&amp;#45;scale&amp;#45;nfs&amp;#45;&lt;b&gt;v4&lt;/b&gt;.sh&lt;/tt&gt; script is incorrectly checking:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
export ALWAYS_EXCEPT=&lt;span class=&quot;code-quote&quot;&gt;&quot;$PARALLEL_SCALE_NFSV3_EXCEPT &quot;&lt;/span&gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;so this should also be updated to check &lt;tt&gt;PARALLEL_SCALE_NFSV4_EXCEPT&lt;/tt&gt;. It may be that this is why racer_on_nfs is sometimes being skipped when running &lt;tt&gt;parallel&amp;#45;scale&amp;#45;nfsv4&lt;/tt&gt; - when it is run after &lt;tt&gt;parallel&amp;#45;scale&amp;#45;nfsv3&lt;/tt&gt;?&lt;/p&gt;

&lt;p&gt;It would also be useful to see if the passing cases (without unmount timeout) are only for interop (I saw one case with ddn31 or similar, not sure of others).  Checking this, and going back through the test history to see if there was a time this was passing regularly would help isolate if there was a patch landed that caused this problem. &lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=yujian&quot; class=&quot;user-hover&quot; rel=&quot;yujian&quot;&gt;yujian&lt;/a&gt;, can you please re-add NFS testing to your patches, but skip racer:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Test-Parameters: trivial
Test-Parameters: testlist=env=PARALLEL_SCALE_NFSV3_EXCEPT=racer_on_nfs 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;This should hopefully now pass. &lt;/p&gt;</comment>
                            <comment id="388008" author="yujian" created="Tue, 3 Oct 2023 20:56:46 +0000"  >&lt;p&gt;Sure, &lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=adilger&quot; class=&quot;user-hover&quot; rel=&quot;adilger&quot;&gt;adilger&lt;/a&gt;. I found ALWAYS_EXCEPT was not defined in parallel-scale-nfsv4.sh, so while updating patch &lt;a href=&quot;https://review.whamcloud.com/52533&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/52533&lt;/a&gt;, I added it and also added racer_on_nfs test into the always_except list.&lt;/p&gt;</comment>
                            <comment id="388173" author="adilger" created="Wed, 4 Oct 2023 23:33:41 +0000"  >&lt;p&gt;You are right.  I guess I was mistakenly looking at the nfsv3.sh file, and there is nothing in the nfsv4.sh file that allows setting &lt;tt&gt;ALWAYS_EXCEPT&lt;/tt&gt;.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="78157">LU-17152</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="51511">LU-10851</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i03wzz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>