<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:34:27 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-17317] sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0</title>
                <link>https://jira.whamcloud.com/browse/LU-17317</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for S Buisson &amp;lt;sbuisson@ddn.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/d7c41dec-3599-4738-b89d-03f240498d8c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/d7c41dec-3599-4738-b89d-03f240498d8c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_16 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;test all_off:60001:c0:60003:003, wanted 1 1, got 0 0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Test session details:&lt;br/&gt;
clients: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-b_es-reviews/15743&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-b_es-reviews/15743&lt;/a&gt; - 4.18.0-477.27.1.el8_8.x86_64&lt;br/&gt;
servers: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-b_es-reviews/15743&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-b_es-reviews/15743&lt;/a&gt; - 4.18.0-477.27.1.el8_lustre.ddn17.x86_64&lt;/p&gt;








&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
sanity-sec test_16 - test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&lt;/p&gt;</description>
                <environment></environment>
        <key id="79199">LU-17317</key>
            <summary>sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Tue, 28 Nov 2023 07:57:57 +0000</created>
                <updated>Tue, 9 Jan 2024 10:38:14 +0000</updated>
                            <resolved>Tue, 9 Jan 2024 10:38:14 +0000</resolved>
                                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="395307" author="sebastien" created="Mon, 4 Dec 2023 09:28:28 +0000"  >&lt;p&gt;For instance, for this failure in sanity-sec test_17:&lt;br/&gt;
&lt;a href=&quot;https://testing.whamcloud.com/test_sets/1037004b-dbe8-44ef-a668-4eed6e6114eb&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/1037004b-dbe8-44ef-a668-4eed6e6114eb&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;We have the following nodes:&lt;/p&gt;
&lt;ul class=&quot;alternate&quot; type=&quot;square&quot;&gt;
	&lt;li&gt;MDS 1, MDS 3 (trevis-94vm6)&lt;br/&gt;
10.240.43.205@tcp&lt;/li&gt;
	&lt;li&gt;Client 1 (trevis-94vm1)&lt;br/&gt;
10.240.43.200@tcp&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;The MDS wants a client to release a lock, by sending an LDLM_BL_CALLBACK request (104). But it gets an error from the client (called a &apos;reverse server&apos; in the GSS exchanges).&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:00100000:1.0:1701460059.716146:0:10439:0:(client.c:1758:ptlrpc_send_new_req()) Sending RPC req@0000000014e4d538 pname:cluuid:pid:xid:nid:opc:job mdt00_003:lustre-MDT0002_UUID:10439:1784106942685952:10.240.43.200@tcp:104:
00000100:00100000:1.0:1701460059.716168:0:10439:0:(client.c:2533:ptlrpc_set_wait()) set 00000000e75f5696 going to sleep for 11 seconds
02000000:00000400:1.0:1701460059.716391:0:10439:0:(sec_gss.c:685:gss_cli_ctx_handle_err_notify()) req x1784106942685952/t0, ctx 0000000082de400c idx 0x544590679e7e5f1c(0-&amp;gt;c): reverse server respond (00080000/00000000)
00000100:00020000:1.0:1701460059.716395:0:10439:0:(client.c:1479:after_reply()) @@@ unwrap reply failed: rc = -22  req@0000000014e4d538 x1784106942685952/t0(0) o104-&amp;gt;lustre-MDT0002@10.240.43.200@tcp:15/16 lens 328/224 e 0 to 0 dl 1701460070 ref 1 fl Rpc:RQU/0/ffffffff rc 0/-1 job:&apos;&apos;
00000100:00100000:1.0:1701460059.716403:0:10439:0:(client.c:2239:ptlrpc_check_set()) Completed RPC req@0000000014e4d538 pname:cluuid:pid:xid:nid:opc:job mdt00_003:lustre-MDT0002_UUID:10439:1784106942685952:10.240.43.200@tcp:104:
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;And indeed on the client, the GSS context id (544590679e7e5f1c) is considered invalid.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:00100000:0.0:1701460059.716218:0:8154:0:(events.c:373:request_in_callback()) peer: 12345-10.240.43.205@tcp (source: 12345-10.240.43.205@tcp)
02000000:00000400:0.0:1701460059.716236:0:207145:0:(gss_svc_upcall.c:1619:gss_svc_upcall_get_ctx()) Invalid gss ctx idx 0x544590679e7e5f1c from 10.240.43.205@tcp
02000000:08000000:0.0:1701460059.716239:0:207145:0:(sec_gss.c:1969:gss_pack_err_notify()) prepare gss error notify(0x80000/0x0) to 10.240.43.205@tcp
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;So this client ends up not refreshing its lock. This is a problem as file/dir access rights were changed from a different client.&lt;/p&gt;</comment>
                            <comment id="395990" author="gerrit" created="Fri, 8 Dec 2023 10:46:47 +0000"  >&lt;p&gt;&quot;Sebastien Buisson &amp;lt;sbuisson@ddn.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/53377&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/53377&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17317&quot; title=&quot;sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17317&quot;&gt;&lt;del&gt;LU-17317&lt;/del&gt;&lt;/a&gt; gss: no cache flush for rsi and rsc&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: a785f7c4c2a71064cb61023e479ded0347d16b72&lt;/p&gt;</comment>
                            <comment id="396036" author="sebastien" created="Fri, 8 Dec 2023 16:19:13 +0000"  >&lt;p&gt;The problem described here stems from the fact that the server side can use outdated gss contexts in ldlm callbacks. Apparently this was fine with the previous gss code based on the sunrpc cache, because the cache entries were removed (very) asynchronously. With the new implementation based on the upcall cache, the cache entries are removed when they are found to be expired. This explains why, with this new code, the server gets &lt;tt&gt;GSS_S_NO_CONTEXT&lt;/tt&gt; from an evicted client if the server has sent an outdated gss context.&lt;/p&gt;

&lt;p&gt;So patch &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17317&quot; title=&quot;sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17317&quot;&gt;&lt;del&gt;LU-17317&lt;/del&gt;&lt;/a&gt; gss: do not continue using expired reverse context&quot; &lt;a href=&quot;https://review.whamcloud.com/53375&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/53375&lt;/a&gt; aims at surviving this situation. The server is still allowed to try to use an outdated gss context (this is important for inflight communications), but if it gets &lt;tt&gt;GSS_S_NO_CONTEXT&lt;/tt&gt; from the client, then it marks this gss context as dead, and replaces it with a new one.&lt;/p&gt;</comment>
                            <comment id="396209" author="gerrit" created="Mon, 11 Dec 2023 08:15:37 +0000"  >&lt;p&gt;&quot;Sebastien Buisson &amp;lt;sbuisson@ddn.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/53405&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/53405&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17317&quot; title=&quot;sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17317&quot;&gt;&lt;del&gt;LU-17317&lt;/del&gt;&lt;/a&gt; dbg: investigate test failures - 1&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 4b9b24ab89f4992ba40272cb0fddda0636a0152e&lt;/p&gt;</comment>
                            <comment id="397553" author="gerrit" created="Wed, 20 Dec 2023 02:00:05 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/53377/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/53377/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17317&quot; title=&quot;sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17317&quot;&gt;&lt;del&gt;LU-17317&lt;/del&gt;&lt;/a&gt; gss: no cache flush for rsi and rsc&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 3615fa4a86be793652d53c94818c5aeb81e2257e&lt;/p&gt;</comment>
                            <comment id="398369" author="gerrit" created="Wed, 3 Jan 2024 03:03:06 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/53375/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/53375/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17317&quot; title=&quot;sanity-sec test_16: test all_off:60001:c0:60003:003, wanted 1 1, got 0 0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17317&quot;&gt;&lt;del&gt;LU-17317&lt;/del&gt;&lt;/a&gt; gss: do not continue using expired reverse context&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 67acf6047e343a0e35f077c6aed4483a14d2015c&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="78573">LU-17228</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="78924">LU-17286</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i042yv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>