<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:19:28 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-15572] Interop sanity-flr failing with &quot;cannot get UNLOCK lease&quot;</title>
                <link>https://jira.whamcloud.com/browse/LU-15572</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Running sanity-flr in interop mode fails a number of subtests:&lt;br/&gt;
&lt;a href=&quot;https://testing.whamcloud.com/test_sets/0a29fd64-d2e6-4cbf-b636-b1deae709128&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/0a29fd64-d2e6-4cbf-b636-b1deae709128&lt;/a&gt;&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;lfs mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
</description>
                <environment></environment>
        <key id="68768">LU-15572</key>
            <summary>Interop sanity-flr failing with &quot;cannot get UNLOCK lease&quot;</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="adilger">Andreas Dilger</reporter>
                        <labels>
                    </labels>
                <created>Sun, 20 Feb 2022 17:19:22 +0000</created>
                <updated>Wed, 21 Dec 2022 22:47:23 +0000</updated>
                            <resolved>Sat, 5 Mar 2022 21:00:31 +0000</resolved>
                                    <version>Lustre 2.15.0</version>
                    <version>Lustre 2.15.1</version>
                                    <fixVersion>Lustre 2.15.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="326792" author="adilger" created="Sun, 20 Feb 2022 17:27:51 +0000"  >&lt;p&gt;Temporarily bumping this up to a blocker to ensure it is reviewed. This appears to be a real interop issue between 2.14.0 and 2.15.0, and not only a test script issue. &lt;/p&gt;</comment>
                            <comment id="326793" author="adilger" created="Sun, 20 Feb 2022 17:29:10 +0000"  >&lt;p&gt;This may have been introduced with the landing of patch &lt;a href=&quot;https://review.whamcloud.com/45636&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45636&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15268&quot; title=&quot;lfs mirror extend error propagation&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15268&quot;&gt;&lt;del&gt;LU-15268&lt;/del&gt;&lt;/a&gt; &#8216;mdt: reveal the real intent close error code&lt;/tt&gt;&quot;, which is also causing other interop failures like &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15552&quot; title=&quot;Interop: sanity-flr test 0d fails with &amp;#39;exceeded maximum mirror count returns 16 not ERANGE(34)&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15552&quot;&gt;LU-15552&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="326794" author="adilger" created="Sun, 20 Feb 2022 17:34:00 +0000"  >&lt;p&gt;This affects sanity-flr test_0b test_50a test_60b test_61b test_203 &lt;/p&gt;</comment>
                            <comment id="326798" author="adilger" created="Sun, 20 Feb 2022 18:32:29 +0000"  >&lt;p&gt;Bobijam, could you please take a look at this. It looks like more than just a test script issue, but an actual interop bug with FLR, since it is failing in a variety of different tests. &lt;/p&gt;</comment>
                            <comment id="326802" author="adilger" created="Sun, 20 Feb 2022 19:05:28 +0000"  >&lt;p&gt;This is also causing sanity test_272d, test_272e, and test_272f to fail in interop testing. &lt;/p&gt;</comment>
                            <comment id="327232" author="bobijam" created="Thu, 24 Feb 2022 09:22:59 +0000"  >&lt;p&gt;Could be an interop issue between 2.15.0 client and 2.14.0 MDS on mirror split operation.&lt;/p&gt;

&lt;p&gt;test_0b:&lt;br/&gt;
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)&lt;br/&gt;
error lfs mirror delete: cannot split &apos;/mnt/lustre/d0b.sanity-flr/f0b.sanity-flr&apos;: Device or resource busy&lt;/p&gt;

&lt;p&gt;test_50A:&lt;br/&gt;
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)&lt;br/&gt;
error lfs mirror split: cannot split &apos;/mnt/lustre/d50A.sanity-flr/f50A.sanity-flr&apos;: Device or resource busy&lt;/p&gt;

&lt;p&gt;test_60b:&lt;br/&gt;
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)&lt;br/&gt;
error lfs mirror split: cannot split &apos;/mnt/lustre/d60b.sanity-flr/f60b.sanity-flr&apos;: Device or resource busy&lt;/p&gt;

&lt;p&gt;test_61b:&lt;br/&gt;
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)&lt;br/&gt;
error lfs mirror split: cannot split &apos;/mnt/lustre/d61b.sanity-flr/f61b.sanity-flr&apos;: Device or resource busy&lt;/p&gt;

&lt;p&gt;test_203:&lt;br/&gt;
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)&lt;br/&gt;
error lfs mirror delete: cannot split &apos;/mnt/lustre/f203.sanity-flr&apos;: Device or resource busy&lt;/p&gt;

&lt;p&gt;take test_60b as an example:&lt;br/&gt;
on MDS, it received the file close intent for mirror split request, and finished it successfully&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:00100000:1.0:1645359656.359528:0:991126:0:(service.c:2142:ptlrpc_server_handle_req_in()) got req x1725282051462784
00000100:00100000:1.0:1645359656.359542:0:991126:0:(service.c:2299:ptlrpc_server_handle_request()) Handling RPC req@0000000030f1e911 pname:cluuid+ref:pid:xid:nid:opc:job mdt_rdpg00_001:67bf88ef-fd73-4c00-9a58-d65897456138+35:1227937:x1725282051462784:12345-10.240.25.52@tcp:35:lfs.0
...
00000100:00100000:1.0:1645359656.362030:0:991126:0:(service.c:2348:ptlrpc_server_handle_request()) Handled RPC req@0000000030f1e911 pname:cluuid+ref:pid:xid:nid:opc:job mdt_rdpg00_001:67bf88ef-fd73-4c00-9a58-d65897456138+32:1227937:x1725282051462784:12345-10.240.25.52@tcp:35:lfs.0 Request processed in 2487us (2537us total) trans 85899346091 rc 0/0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;while on client, I don&apos;t see the failure reason&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000080:00200000:1.0:1645359656.359344:0:1227937:0:(file.c:3896:ll_file_ioctl()) VFS Op:inode=[0x2000090a6:0x4e:0x0](00000000a9e821ea), cmd=c00c66f3
00000002:00100000:1.0:1645359656.359354:0:1227937:0:(mdc_request.c:944:mdc_close()) @@@ matched open  req@00000000d7fc9409 x1725282051460736/t85899346086(85899346086) o101-&amp;gt;lustre-MDT0000-mdc-ffff913d103c9000@10.240.25.55@tcp:12/10 lens 576/656 e 0 to 0 dl 1645359663 ref 1 fl Complete:RPQU/4/ffffffff rc 0/-1 job:&apos;lfs.0&apos;
00000100:00100000:1.0:1645359656.359372:0:1227937:0:(client.c:742:ptlrpc_reassign_next_xid()) @@@ reassign xid  req@000000008e2795d6 x1725282051462784/t0(0) o35-&amp;gt;lustre-MDT0000-mdc-ffff913d103c9000@10.240.25.55@tcp:23/10 lens 504/1072 e 0 to 0 dl 0 ref 1 fl New:QU/0/ffffffff rc 0/-1 job:&apos;&apos;
00000100:00100000:1.0:1645359656.359378:0:1227937:0:(client.c:1733:ptlrpc_send_new_req()) Sending RPC req@000000008e2795d6 pname:cluuid:pid:xid:nid:opc:job lfs:67bf88ef-fd73-4c00-9a58-d65897456138:1227937:1725282051462784:10.240.25.55@tcp:35:lfs.0
...
00000100:00100000:1.0:1645359656.362161:0:1227937:0:(client.c:2210:ptlrpc_check_set()) Completed RPC req@000000008e2795d6 pname:cluuid:pid:xid:nid:opc:job lfs:67bf88ef-fd73-4c00-9a58-d65897456138:1227937:1725282051462784:10.240.25.55@tcp:35:lfs.0
00000002:00100000:1.0:1645359656.362168:0:1227937:0:(mdc_request.c:854:mdc_free_open()) @@@ free open request, rq_replay=0  req@00000000d7fc9409 x1725282051460736/t85899346086(85899346086) o101-&amp;gt;lustre-MDT0000-mdc-ffff913d103c9000@10.240.25.55@tcp:12/10 lens 576/656 e 0 to 0 dl 1645359663 ref 1 fl Complete:RQU/4/ffffffff rc 0/-1 job:&apos;lfs.0&apos;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="327236" author="bobijam" created="Thu, 24 Feb 2022 10:16:27 +0000"  >&lt;p&gt;The patch &lt;a href=&quot;https://review.whamcloud.com/45636&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45636&lt;/a&gt;&#160;&quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15268&quot; title=&quot;lfs mirror extend error propagation&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15268&quot;&gt;&lt;del&gt;LU-15268&lt;/del&gt;&lt;/a&gt;&#160;&#8216;mdt: reveal the real intent close error code&lt;/tt&gt;&quot; is a server-only patch, so it should be something else causing the interop failure.&lt;/p&gt;</comment>
                            <comment id="327245" author="bobijam" created="Thu, 24 Feb 2022 10:38:21 +0000"  >&lt;p&gt;I think it could be that patch &lt;a href=&quot;https://review.whamcloud.com/42116&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/42116&lt;/a&gt; &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14521&quot; title=&quot;delete FLR mirrors without volatile files&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14521&quot;&gt;&lt;del&gt;LU-14521&lt;/del&gt;&lt;/a&gt; &apos;flr: delete mirror without volatile file&apos;&quot; does not catch the proper error code from an old MDS (it expects -EINVAL from the MDS, while the old server returns -EBUSY in mirror delete).&lt;/p&gt;</comment>
                            <comment id="327246" author="bobijam" created="Thu, 24 Feb 2022 10:42:26 +0000"  >&lt;p&gt;We could use the following patch for 2.15 to catch the older MDS&apos;s ambiguous error code:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
diff --git a/lustre/utils/lfs.c b/lustre/utils/lfs.c
index 3a1511fe05..e5d245af3e 100644
--- a/lustre/utils/lfs.c
+++ b/lustre/utils/lfs.c
@@ -2329,7 +2329,7 @@ again:
&#160; &#160; &#160; &#160; data-&amp;gt;lil_ids[1] = mirror_id;
&#160; &#160; &#160; &#160; rc = llapi_lease_set(fd, data);
&#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc &amp;lt;= 0) {
- &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc == -EINVAL &amp;amp;&amp;amp; purge) {
+ &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (purge) {
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-comment&quot;&gt;/* could be old MDS which prohibit fd==fdv */&lt;/span&gt;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; purge = &lt;span class=&quot;code-keyword&quot;&gt;false&lt;/span&gt;;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;goto&lt;/span&gt; again; &lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="327288" author="adilger" created="Thu, 24 Feb 2022 16:13:50 +0000"  >&lt;p&gt;Bobijam, rather than pasting the patch here as a comment, could you please submit it as a patch to Gerrit and add a Test-Parameters line to run it in interop mode:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Test-Parameters: trivial serverversion=2.14.0 testlist=sanity env=ONLY=&quot;0 50 60 61&quot;
Test-Parameters: clientversion=2.14.0 testlist=sanity env=ONLY=&quot;0 50 60 61&quot;
Test-Parameters: serverversion=2.12.8 testlist=sanity env=ONLY=&quot;0 50 60 61&quot;
Test-Parameters: clientversion=2.12.8 testlist=sanity env=ONLY=&quot;0 50 60 61&quot;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="327379" author="gerrit" created="Fri, 25 Feb 2022 08:41:27 +0000"  >&lt;p&gt;&quot;Bobi Jam &amp;lt;bobijam@hotmail.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/46614&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/46614&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15572&quot; title=&quot;Interop sanity-flr failing with &amp;quot;cannot get UNLOCK lease&amp;quot;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15572&quot;&gt;&lt;del&gt;LU-15572&lt;/del&gt;&lt;/a&gt; util: mirror delete with old MDS&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: cdd3a1299ca77face6078caa254ffa2b493cbf3e&lt;/p&gt;</comment>
                            <comment id="328196" author="gerrit" created="Sat, 5 Mar 2022 20:42:31 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/46614/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/46614/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15572&quot; title=&quot;Interop sanity-flr failing with &amp;quot;cannot get UNLOCK lease&amp;quot;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15572&quot;&gt;&lt;del&gt;LU-15572&lt;/del&gt;&lt;/a&gt; util: mirror delete with old MDS&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 79f8a4a38c71c7f06ac561ca4cd6d6b9cb5aa4fb&lt;/p&gt;</comment>
                            <comment id="328206" author="pjones" created="Sat, 5 Mar 2022 21:00:31 +0000"  >&lt;p&gt;Landed for 2.15&lt;/p&gt;</comment>
                            <comment id="342305" author="sarah" created="Tue, 2 Aug 2022 19:30:01 +0000"  >&lt;p&gt;Still seeing this error in sanity-flr test_50a in 2.15.1 interop with 2.12.9 el7.9 servers. In the current testing, it seems to happen only in subtest 50a.&lt;br/&gt;
&lt;a href=&quot;https://testing.whamcloud.com/test_sets/1f2bc891-06de-4859-97b1-f51a7ed6cf2f&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/1f2bc891-06de-4859-97b1-f51a7ed6cf2f&lt;/a&gt;&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;trevis-96vm2: trevis-96vm2.trevis.whamcloud.com: executing wait_import_state_mount (FULL|IDLE) mdc.lustre-MDT0000-mdc-*.mds_server_uuid
trevis-96vm1: CMD: trevis-96vm1.trevis.whamcloud.com lctl get_param -n at_max
trevis-96vm1: mdc.lustre-MDT0000-mdc-*.mds_server_uuid in FULL state after 0 sec
trevis-96vm2: CMD: trevis-96vm2.trevis.whamcloud.com lctl get_param -n at_max
trevis-96vm2: mdc.lustre-MDT0000-mdc-*.mds_server_uuid in FULL state after 0 sec
lfs mirror mirror: cannot get UNLOCK lease, ext 8: Device or resource busy (16)
/mnt/lustre/d50A.sanity-flr/f50A.sanity-flr layout generation from 2 to 1
 sanity-flr test_50A: @@@@@@ FAIL: split does not increase layout gen from 2 to 1 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="68638">LU-15552</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="67297">LU-15268</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02iu7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>