<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:04:26 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13813] conf-sanity test_112: can&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN</title>
                <link>https://jira.whamcloud.com/browse/LU-13813</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for vik &amp;lt;vlapa@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/c03460d0-489d-4fbb-84e5-d7df9a59d9dc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/c03460d0-489d-4fbb-84e5-d7df9a59d9dc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_112 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;import is not in FULL state
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Investigation showed that the MDS was not connected during the start_mds test step in _wait_import_state()&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;can\&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The debug log from vm2 contains messages about import state changes: &lt;br/&gt;
MDT0000_UUID: changing import state from DISCONN to CONNECTING and &lt;br/&gt;
MDT0000_UUID: changing import state from CONNECTING to DISCONN&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:00080000:1.0:1594563480.058266:0:25586:0:(import.c:86:import_set_state_nolock()) ffff9a285a1e5000 lustre-MDT0000_UUID: changing import state from DISCONN to CONNECTING
00000100:00080000:1.0:1594563480.058358:0:25586:0:(pinger.c:242:ptlrpc_pinger_process_import()) 2d768d9f-aa8c-42e0-a75c-fa93c720357c-&amp;gt;lustre-MDT0000_UUID: level DISCONN/3 force 0 force_next 0 deactive 0 pingable 1 suppress 0
00000100:00080000:1.0:1594563480.058361:0:25586:0:(import.c:86:import_set_state_nolock()) ffff9a287aae0000 lustre-MDT0000_UUID: changing import state from DISCONN to CONNECTING
00000100:00080000:1.0:1594563480.059863:0:10210:0:(import.c:86:import_set_state_nolock()) ffff9a285a1e5000 lustre-MDT0000_UUID: changing import state from CONNECTING to DISCONN
00000100:00080000:1.0:1594563480.059906:0:10210:0:(import.c:86:import_set_state_nolock()) ffff9a287aae0000 lustre-MDT0000_UUID: changing import state from CONNECTING to DISCONN
00000001:02000400:0.0:1594563481.248258:0:24754:0:(debug.c:712:libcfs_debug_mark_buffer()) DEBUG MARKER: /usr/sbin/lctl mark  rpc : @@@@@@ FAIL: can\&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN
00000001:02000400:1.0:1594563481.249585:0:24755:0:(debug.c:712:libcfs_debug_mark_buffer()) DEBUG MARKER: /usr/sbin/lctl mark  rpc : @@@@@@ FAIL: can\&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Started lustre-MDT0000
CMD: onyx-42vm1.onyx.whamcloud.com,onyx-42vm2 PATH=/usr/lib64/lustre/tests:/usr/lib/lustre/tests:/usr/lib64/lustre/tests:/opt/iozone/bin:/opt/iozone/bin:/opt/iozone/bin:/usr/lib64/lustre/tests/mpi:/usr/lib64/lustre/tests/racer:/usr/lib64/lustre/../lustre-iokit/sgpdd-survey:/usr/lib64/lustre/tests:/usr/lib64/lustre/utils/gss:/usr/lib64/lustre/utils:/usr/lib64/qt-3.3/bin:/usr/lib64/openmpi/bin:/usr/local/sbin:/usr/local/bin:/usr/sbin:/usr/bin:/usr/sbin:/sbin:/bin::/sbin:/bin:/usr/sbin: NAME=autotest_config bash rpc.sh wait_import_state_mount FULL mdc.lustre-MDT0000-mdc-*.mds_server_uuid 
onyx-42vm1: == rpc test complete, duration -o sec ================================================================ 13:53:10 (1594561990)
onyx-42vm2: == rpc test complete, duration -o sec ================================================================ 13:53:10 (1594561990)
onyx-42vm1: CMD: onyx-42vm4 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm2: CMD: onyx-42vm4 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm1: CMD: onyx-42vm4 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm2: CMD: onyx-42vm4 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm1: CMD: onyx-42vm3 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm2: CMD: onyx-42vm3 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm1: CMD: onyx-42vm1.onyx.whamcloud.com /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm2: CMD: onyx-42vm2.onyx.whamcloud.com /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
onyx-42vm1: onyx-42vm1.onyx.whamcloud.com: executing wait_import_state_mount FULL mdc.lustre-MDT0000-mdc-*.mds_server_uuid
onyx-42vm2: onyx-42vm2.onyx.whamcloud.com: executing wait_import_state_mount FULL mdc.lustre-MDT0000-mdc-*.mds_server_uuid
onyx-42vm2: CMD: onyx-42vm2.onyx.whamcloud.com lctl get_param -n at_max
onyx-42vm2:  rpc : @@@@@@ FAIL: can&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN 
onyx-42vm2:   Trace dump:
onyx-42vm2:   = /usr/lib64/lustre/tests/test-framework.sh:6216:error()
onyx-42vm2:   = /usr/lib64/lustre/tests/test-framework.sh:7395:_wait_import_state()
onyx-42vm2:   = /usr/lib64/lustre/tests/test-framework.sh:7417:wait_import_state()
onyx-42vm2:   = /usr/lib64/lustre/tests/test-framework.sh:7426:wait_import_state_mount()
onyx-42vm2:   = rpc.sh:18:main()
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;







&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
conf-sanity test_112 - import is not in FULL state&lt;/p&gt;</description>
                <environment></environment>
        <key id="60085">LU-13813</key>
            <summary>conf-sanity test_112: can&apos;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="yujian">Jian Yu</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Wed, 22 Jul 2020 16:01:28 +0000</created>
                <updated>Mon, 27 Mar 2023 21:13:44 +0000</updated>
                            <resolved>Fri, 19 Aug 2022 16:03:02 +0000</resolved>
                                    <version>Lustre 2.14.0</version>
                    <version>Lustre 2.15.0</version>
                                    <fixVersion>Lustre 2.16.0</fixVersion>
                    <fixVersion>Lustre 2.15.2</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="291384" author="adilger" created="Sat, 6 Feb 2021 01:21:56 +0000"  >&lt;p&gt;Fixed via &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13184&quot; title=&quot;conf-sanity test_112: problem creating f112.conf-sanity.0 on OST0000&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13184&quot;&gt;&lt;del&gt;LU-13184&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="292318" author="jamesanunez" created="Thu, 18 Feb 2021 16:59:50 +0000"  >&lt;p&gt;It looks like we&#8217;re seeing this issue or something similar for 2.14.0-RC3 ldiskfs non-DNE testing; &lt;a href=&quot;https://testing.whamcloud.com/test_sets/14efbbbc-a9fd-4ed7-999c-71e1f38af9a6&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/14efbbbc-a9fd-4ed7-999c-71e1f38af9a6&lt;/a&gt; . If this is a new issue, I can close this ticket and open a new one.&lt;/p&gt;

&lt;p&gt;The client error messages look the same, but on the MDS (vm4), we see the DISCONN to CONNECTING state changes:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00000100:00080000:0.0:1613560151.829979:0:3006202:0:(import.c:86:import_set_state_nolock()) 0000000059d48be4 lustre-OST0000_UUID: changing import state from CONNECTING to DISCONN
00000100:00000001:1.0:1613560151.829981:0:3128009:0:(pinger.c:158:ptlrpc_ping()) Process leaving (rc=0 : 0 : 0)
00000020:00000001:1.0:1613560151.829983:0:3128009:0:(lprocfs_status.c:1609:lprocfs_read_helper()) Process leaving (rc=276728730 : 276728730 : 107e8b9a)
00000020:00000001:1.0:1613560151.829984:0:3128009:0:(lprocfs_status.c:1609:lprocfs_read_helper()) Process leaving (rc=18446744073561016351 : -148535265 : fffffffff725881f)
00000100:00080000:0.0:1613560151.829984:0:3006202:0:(import.c:1440:ptlrpc_connect_interpret()) recovery of lustre-OST0000_UUID on 10.2.8.108@tcp failed (-110)
00000100:00000040:1.0:1613560151.829985:0:3128009:0:(pinger.c:322:ptlrpc_pinger_main()) next wakeup in 5 (51652)
00000100:00000001:0.0:1613560151.829985:0:3006202:0:(import.c:1446:ptlrpc_connect_interpret()) Process leaving (rc=18446744073709551506 : -110 : ffffffffffffff92)
00000100:00080000:1.0:1613560151.829986:0:3128009:0:(pinger.c:249:ptlrpc_pinger_process_import()) lustre-MDT0000-mdtlov_UUID-&amp;gt;lustre-OST0000_UUID: level DISCONN/3 force 1 force_next 0 deactive 0 pingable 0 suppress 1
00000100:00000040:0.0:1613560151.829986:0:3006202:0:(lustre_net.h:2470:ptlrpc_rqphase_move()) @@@ move request phase from Interpret to Complete  req@00000000e533b5b3 x1691936139685568/t0(0) o8-&amp;gt;lustre-OST0000-osc-MDT0000@10.2.8.108@tcp:28/4 lens 520/544 e 0 to 1 dl 1613560151 ref 1 fl Interpret:EXNQU/0/ffffffff rc -110/-1 job:&apos;kworker/u4:1.0&apos;
00000100:00000001:1.0:1613560151.829988:0:3128009:0:(recover.c:56:ptlrpc_initiate_recovery()) Process entered
00000100:00080000:1.0:1613560151.829989:0:3128009:0:(recover.c:58:ptlrpc_initiate_recovery()) lustre-OST0000_UUID: starting recovery
00000100:00000001:1.0:1613560151.829990:0:3128009:0:(import.c:697:ptlrpc_connect_import_locked()) Process entered
00000100:00080000:1.0:1613560151.829990:0:3128009:0:(import.c:86:import_set_state_nolock()) 0000000059d48be4 lustre-OST0000_UUID: changing import state from DISCONN to CONNECTING
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="329678" author="adilger" created="Sat, 19 Mar 2022 23:35:01 +0000"  >&lt;p&gt;+1 on master: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/7fb8c261-d3c5-4f43-af97-6cb1e10724ad&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/7fb8c261-d3c5-4f43-af97-6cb1e10724ad&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="339345" author="adilger" created="Thu, 30 Jun 2022 22:13:28 +0000"  >&lt;p&gt;It seems all PASS cases are with DNE mode, and all failed for single MDS. &lt;/p&gt;

&lt;p&gt;Should we just add an &lt;tt&gt;((MDSCOUNT &amp;gt;= 2))&lt;/tt&gt; check?  I don&apos;t know &lt;em&gt;why&lt;/em&gt; this is failing only for single-MDS tests and passing for DNE, but at least we wouldn&apos;t have continuous failures.&lt;/p&gt;</comment>
                            <comment id="341310" author="yujian" created="Fri, 22 Jul 2022 23:23:19 +0000"  >&lt;p&gt;The failure can be reproduced by running test 112 after test 111. It passed in review test sessions because test 111 was skipped with SLOW=no.&lt;br/&gt;
I&apos;m working on a patch to fix the test script.&lt;br/&gt;
&#160;&lt;/p&gt;</comment>
                            <comment id="341318" author="gerrit" created="Sat, 23 Jul 2022 07:22:29 +0000"  >&lt;p&gt;&quot;Jian Yu &amp;lt;yujian@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/48021&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48021&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13813&quot; title=&quot;conf-sanity test_112: can&amp;#39;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13813&quot;&gt;&lt;del&gt;LU-13813&lt;/del&gt;&lt;/a&gt; tests: fix stack_trap in conf-sanity test 110/111&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: f6ad9782eed05eaa9b2af29e70080652e0d03e10&lt;/p&gt;</comment>
                            <comment id="341319" author="gerrit" created="Sat, 23 Jul 2022 07:28:24 +0000"  >&lt;p&gt;&quot;Jian Yu &amp;lt;yujian@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/48022&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48022&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13813&quot; title=&quot;conf-sanity test_112: can&amp;#39;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13813&quot;&gt;&lt;del&gt;LU-13813&lt;/del&gt;&lt;/a&gt; tests: fix stack_trap in conf-sanity test 110/111&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 77c40a5864758698bf92f74ff419b00491d402c8&lt;/p&gt;</comment>
                            <comment id="344049" author="gerrit" created="Fri, 19 Aug 2022 04:33:02 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/48022/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48022/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13813&quot; title=&quot;conf-sanity test_112: can&amp;#39;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13813&quot;&gt;&lt;del&gt;LU-13813&lt;/del&gt;&lt;/a&gt; tests: fix stack_trap in conf-sanity test 110/111&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 0109cee2610b8dfeaaca25c3eb1e805e033c593d&lt;/p&gt;</comment>
                            <comment id="344119" author="pjones" created="Fri, 19 Aug 2022 16:03:02 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                            <comment id="344180" author="gerrit" created="Sat, 20 Aug 2022 16:14:14 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/48021/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/48021/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13813&quot; title=&quot;conf-sanity test_112: can&amp;#39;t put import for mdc.lustre-MDT0000-mdc-*.mds_server_uuid into FULL state after 1475 sec, have DISCONN&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13813&quot;&gt;&lt;del&gt;LU-13813&lt;/del&gt;&lt;/a&gt; tests: fix stack_trap in conf-sanity test 110/111&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 0331d908abcb026fb450241ac8566d1a2bf425bc&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="57148">LU-12857</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="58029">LU-13221</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="57023">LU-12818</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="57959">LU-13184</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i015wf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>