<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:26:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16408] replay-dual test_33: unable to mount /mnt/lustre2</title>
                <link>https://jira.whamcloud.com/browse/LU-16408</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for jianyu &amp;lt;yujian@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/bd566ffb-4675-4852-9ac7-ec33bd93b99f&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/bd566ffb-4675-4852-9ac7-ec33bd93b99f&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_33 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Started lustre-MDT0000
Starting client: trevis-83vm7.trevis.whamcloud.com:  -o user_xattr,flock trevis-80vm7@tcp:/lustre /mnt/lustre2
CMD: trevis-83vm7.trevis.whamcloud.com mkdir -p /mnt/lustre2
CMD: trevis-83vm7.trevis.whamcloud.com mount -t lustre -o user_xattr,flock trevis-80vm7@tcp:/lustre /mnt/lustre2
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Dmesg on client:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;LustreError: 11-0: lustre-MDT0000-mdc-ffff9aa6d17cc800: operation mds_connect to node 10.240.42.182@tcp failed: rc = -11
LustreError: Skipped 3 previous similar messages
Lustre: lustre-OST0006-osc-ffff9aa6d92e2800: Connection to lustre-OST0006 (at 10.240.42.196@tcp) was lost; in progress operations using this service will wait for recovery to complete
Lustre: Skipped 6 previous similar messages
Lustre: lustre-OST0001-osc-ffff9aa6d92e2800: Connection restored to  (at 10.240.42.196@tcp) 
Lustre: Skipped 5 previous similar messages
LustreError: 10874:0:(lmv_obd.c:1287:lmv_statfs()) lustre-MDT0000-mdc-ffff9aa6d17cc800: can&apos;t stat MDS #0: rc = -11
Lustre: Unmounted lustre-client
LustreError: 10874:0:(super25.c:181:lustre_fill_super()) llite: Unable to mount &amp;lt;unknown&amp;gt;: rc = -11
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;





&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
replay-dual test_33 - Timeout occurred after 434 minutes, last suite running was replay-dual&lt;/p&gt;</description>
                <environment></environment>
        <key id="73655">LU-16408</key>
            <summary>replay-dual test_33: unable to mount /mnt/lustre2</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="eaujames">Etienne Aujames</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Thu, 15 Dec 2022 20:31:50 +0000</created>
                <updated>Fri, 27 Oct 2023 02:39:53 +0000</updated>
                            <resolved>Sat, 23 Sep 2023 14:10:16 +0000</resolved>
                                    <version>Lustre 2.16.0</version>
                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="356594" author="yujian" created="Thu, 15 Dec 2022 20:33:39 +0000"  >&lt;p&gt;The replay-dual test_33 was added by &lt;a href=&quot;https://review.whamcloud.com/48082&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48082&lt;/a&gt; (&quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15935&quot; title=&quot;MDT mount fails with &amp;quot;duplicate generation for client export&amp;quot; during failover&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15935&quot;&gt;&lt;del&gt;LU-15935&lt;/del&gt;&lt;/a&gt; target: keep track of multirpc slots in last_rcvd&quot;).&lt;br/&gt;
Hi &lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=eaujames&quot; class=&quot;user-hover&quot; rel=&quot;eaujames&quot;&gt;eaujames&lt;/a&gt;, could you please advise?&lt;/p&gt;</comment>
                            <comment id="367371" author="eaujames" created="Mon, 27 Mar 2023 09:21:14 +0000"  >&lt;p&gt;Hi,&lt;/p&gt;

&lt;p&gt;The mounted client did not completely finish its recovery and was evicted in REPLAY_LOCKS:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[Tue Nov 15 16:29:06 2022] LustreError: 876057:0:(mdt_handler.c:7441:mdt_iocontrol()) lustre-MDT0000: Aborting client recovery
[Tue Nov 15 16:29:06 2022] LustreError: 876057:0:(ldlm_lib.c:2888:target_stop_recovery_thread()) lustre-MDT0000: Aborting recovery
[Tue Nov 15 16:29:06 2022] Lustre: 874819:0:(ldlm_lib.c:2294:target_recovery_overseer()) recovery is aborted, evict exports in recovery
[Tue Nov 15 16:29:06 2022] Lustre: 874819:0:(ldlm_lib.c:2294:target_recovery_overseer()) Skipped 2 previous similar messages
[Tue Nov 15 16:29:06 2022] Lustre: lustre-MDT0000: disconnecting 2 stale clients
[Tue Nov 15 16:29:06 2022] LustreError: 874819:0:(tgt_grant.c:257:tgt_grant_sanity_check()) mdt_obd_disconnect: tot_granted 4194304 != fo_tot_granted 6291456
[Tue Nov 15 16:29:06 2022] LustreError: 874819:0:(ldlm_lib.c:1829:abort_lock_replay_queue()) @@@ aborted:  req@00000000b51e723d x1749569008570176/t0(0) o101-&amp;gt;1b7e53c5-3301-41c4-8e4d-aab3eade9ae8@10.240.42.242@tcp:151/0 lens 328/0 e 0 to 0 dl 1668529766 ref 1 fl Complete:/40/ffffffff rc 0/-1 job:&apos;ldlm_lock_repla.0&apos;
[Tue Nov 15 16:29:06 2022] LustreError: 874819:0:(ldlm_lib.c:1829:abort_lock_replay_queue()) Skipped 25 previous similar messages
[Tue Nov 15 16:29:06 2022] Lustre: lustre-MDT0000: Denying connection for new client 1b7e53c5-3301-41c4-8e4d-aab3eade9ae8 (at 10.240.42.242@tcp), waiting for 4 known clients (2 recovered, 0 in progress, and 2 evicted) to recover in 1:14
[Tue Nov 15 16:29:06 2022] Lustre: Skipped 3 previous similar messages &lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;But the client import is set to FULL, the MDT recovery did not finish and then the MDT was unmounted. After remounting the MDT the 2nd client is unable to remount.&lt;/p&gt;

&lt;p&gt;This looks like a new bug. For now, I will stabilize the test.&lt;/p&gt;</comment>
                            <comment id="367375" author="gerrit" created="Mon, 27 Mar 2023 10:24:42 +0000"  >&lt;p&gt;&quot;Etienne AUJAMES &amp;lt;eaujames@ddn.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50434&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50434&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16408&quot; title=&quot;replay-dual test_33: unable to mount /mnt/lustre2&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16408&quot;&gt;&lt;del&gt;LU-16408&lt;/del&gt;&lt;/a&gt; tests: fix replay-dual test 33&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: b513f684834cf0fc7ebab6b319fc2ae098ff60d6&lt;/p&gt;</comment>
                            <comment id="387016" author="gerrit" created="Sat, 23 Sep 2023 06:02:40 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50434/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50434/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16408&quot; title=&quot;replay-dual test_33: unable to mount /mnt/lustre2&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16408&quot;&gt;&lt;del&gt;LU-16408&lt;/del&gt;&lt;/a&gt; tests: fix replay-dual test 33&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 7f89e8c8975fcc82983c5756438861d66e64ec23&lt;/p&gt;</comment>
                            <comment id="387035" author="pjones" created="Sat, 23 Sep 2023 14:10:16 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                            <comment id="387087" author="bzzz" created="Mon, 25 Sep 2023 13:49:01 +0000"  >&lt;p&gt;the patch breaks replay-dual/33 on a local (single VM) setup. before it took ~30 seconds to complete replay-dual, now it can&apos;t complete within 30 minutes.&lt;/p&gt;</comment>
                            <comment id="387450" author="bzzz" created="Wed, 27 Sep 2023 19:23:11 +0000"  >&lt;p&gt;replay-dual/33 gets stuck at the following operation:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
	! combined_mgs_mds || $LCTL get_param mdc.*.ping || &lt;span class=&quot;code-keyword&quot;&gt;true&lt;/span&gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;can you please explain the purpose of this get_param ?&lt;/p&gt;</comment>
                            <comment id="387454" author="bzzz" created="Wed, 27 Sep 2023 19:39:23 +0000"  >&lt;p&gt;actually it is mount_facet mds1 that fails:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
[  122.710153] LustreError: 15c-8: MGC192.168.127.51@tcp: Confguration from log lustre-MDT0000 failed from MGS -5. Communication error between node &amp;amp; MGS, a bad configuration, or other errors. See syslog &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; more info
[  122.715086] LustreError: 7365:0:(tgt_mount.c:1524:server_start_targets()) failed to start server lustre-MDT0000: -5
[  122.715704] LustreError: 7365:0:(tgt_mount.c:2216:server_fill_super()) Unable to start targets: -5
[  122.716325] LustreError: 7365:0:(tgt_mount.c:1752:server_put_super()) no obd lustre-MDT0000
[  122.718737] Lustre: server umount lustre-MDT0000 complete
[  122.719112] LustreError: 7365:0:(super25.c:188:lustre_fill_super()) llite: Unable to mount &amp;lt;unknown&amp;gt;: rc = -5
mount.lustre: mount /dev/mapper/mds1_flakey at /mnt/lustre-mds1 failed: Input/output error
Is the MGS running?
Start of /dev/mapper/mds1_flakey on mds1 failed 5
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="387455" author="eaujames" created="Wed, 27 Sep 2023 19:51:46 +0000"  >&lt;p&gt;Yes, for combined mgt/mdt, when we umount the target (failover) we disable all mgs services. So the IR (Imperative Recovery) is disabled, then the targets states are not directly updated. In the real world it has to wait for the next pinger ping (obd_timeout/4 s).&lt;br/&gt;
The &quot;ping&quot; here is a workaround to force an update of the import state.&lt;/p&gt;

&lt;p&gt;I think the issue here is that if the client is on the MGS, it uses a pingless connection on 0@lo.&lt;br/&gt;
We have to skip this test for single node testing.&lt;/p&gt;

&lt;p&gt;Do you have a failed test link with logs?&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                                        </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="78613">LU-17229</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i0384n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>