<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:26:55 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16425] Interop recovery-small test_144a: MDT failover took 252 seconds</title>
                <link>https://jira.whamcloud.com/browse/LU-16425</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for sarah &amp;lt;sarah@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/e76c370c-50f6-449d-a1ff-7c6e1dd6389a&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/e76c370c-50f6-449d-a1ff-7c6e1dd6389a&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_144a failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;MDT failover took 252 seconds
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Interop between 2.14 server and 2.15.2 client&lt;br/&gt;
client 1 dmesg&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[15447.569384] Lustre: DEBUG MARKER: /usr/sbin/lctl mark == recovery-small test 144a: MDT failover should stop precreation threads ========================================================== 08:27:49 \(1670833669\)
[15447.946594] Lustre: DEBUG MARKER: == recovery-small test 144a: MDT failover should stop precreation threads ========================================================== 08:27:49 (1670833669)
[15455.634777] LustreError: 11-0: lustre-OST0000-osc-ffff8bba43bf3800: operation ost_setattr to node 10.240.25.240@tcp failed: rc = -19
[15455.638069] LustreError: Skipped 9 previous similar messages
[15455.639023] Lustre: lustre-OST0000-osc-ffff8bba43bf3800: Connection to lustre-OST0000 (at 10.240.25.240@tcp) was lost; in progress operations using this service will wait for recovery to complete
[15455.641714] Lustre: Skipped 9 previous similar messages
[15480.556202] Lustre: DEBUG MARKER: PATH=/usr/lib64/lustre/tests:/usr/lib/lustre/tests:/usr/lib64/lustre/tests:/opt/iozone/bin:/opt/iozone/bin:/opt/iozone/bin:/usr/lib64/lustre/tests/mpi:/usr/lib64/lustre/tests/racer:/usr/lib64/lustre/../lustre-iokit/sgpdd-survey:/usr/lib64/lustre/tests:/us
[15483.390342] Lustre: DEBUG MARKER: /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
[15483.788979] Lustre: DEBUG MARKER: /usr/sbin/lctl mark onyx-70vm7.onyx.whamcloud.com: executing wait_import_state_mount \(FULL\|IDLE\) osc.lustre-OST0000-osc-[-0-9a-f]*.ost_server_uuid
[15484.158321] Lustre: DEBUG MARKER: onyx-70vm7.onyx.whamcloud.com: executing wait_import_state_mount (FULL|IDLE) osc.lustre-OST0000-osc-[-0-9a-f]*.ost_server_uuid
[15484.257913] Lustre: DEBUG MARKER: lctl get_param -n at_max
[15484.644084] Lustre: DEBUG MARKER: /usr/sbin/lctl mark osc.lustre-OST0000-osc-[-0-9a-f]*.ost_server_uuid in FULL state after 0 sec
[15485.024198] Lustre: DEBUG MARKER: osc.lustre-OST0000-osc-[-0-9a-f]*.ost_server_uuid in FULL state after 0 sec
[15574.629865] Lustre: 1011245:0:(client.c:2295:ptlrpc_expire_one_request()) @@@ Request sent has timed out for slow reply: [sent 1670833677/real 1670833677] &#160;req@0000000031b8d95f x1751984860062976/t0(0) o101-&amp;gt;lustre-MDT0000-mdc-ffff8bba43bf3800@10.240.25.241@tcp:12/10 lens 4616/70232 e 1 to 1 dl 1670833796 ref 2 fl Rpc:XPQr/0/ffffffff rc 0/-1 job:&apos;touch.0&apos;
[15574.634758] Lustre: 1011245:0:(client.c:2295:ptlrpc_expire_one_request()) Skipped 20 previous similar messages
[15605.861791] INFO: task touch:1011244 blocked for more than 120 seconds.
[15605.867361] &#160; &#160; &#160; Tainted: G &#160; &#160; &#160; &#160; &#160; OE &#160; &#160;--------- - &#160;- 4.18.0-372.32.1.el8_6.x86_64 #1
[15605.868711] &quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot; disables this message.
[15605.869986] task:touch &#160; &#160; &#160; &#160; &#160; state:D stack: &#160; &#160;0 pid:1011244 ppid:1010843 flags:0x00000084
[15605.871366] Call Trace:
[15605.871840] &#160;__schedule+0x2d1/0x840
[15605.872494] &#160;schedule+0x35/0xa0
[15605.873061] &#160;rwsem_down_write_slowpath+0x30c/0x5c0
[15605.873902] &#160;path_openat+0x34b/0x14f0
[15605.874570] &#160;do_filp_open+0x93/0x100
[15605.875200] &#160;? getname_flags+0x4a/0x1e0
[15605.875863] &#160;? __check_object_size+0xac/0x173
[15605.876612] &#160;do_sys_open+0x188/0x220
[15605.877245] &#160;do_syscall_64+0x5b/0x1b0
[15605.877906] &#160;entry_SYSCALL_64_after_hwframe+0x61/0xc6
[15605.878763] RIP: 0033:0x7f460cf5e272
[15605.879394] Code: Unable to access opcode bytes at RIP 0x7f460cf5e248.
[15605.880454] RSP: 002b:00007ffd1250d590 EFLAGS: 00000246 ORIG_RAX: 0000000000000101
[15605.881684] RAX: ffffffffffffffda RBX: 00000000ffffffff RCX: 00007f460cf5e272
[15605.882843] RDX: 0000000000000941 RSI: 00007ffd1250e40d RDI: 00000000ffffff9c
[15605.883998] RBP: 0000000000000000 R08: 0000000000000000 R09: 0000000000000001
[15605.885152] R10: 00000000000001b6 R11: 0000000000000246 R12: 0000000000000001
[15605.886307] R13: 0000000000000001 R14: 00007ffd1250e40d R15: 00007f460d1fd374
[15728.741044] INFO: task touch:1011244 blocked for more than 120 seconds.
[15728.742186] &#160; &#160; &#160; Tainted: G &#160; &#160; &#160; &#160; &#160; OE &#160; &#160;--------- - &#160;- 4.18.0-372.32.1.el8_6.x86_64 #1
[15728.743540] &quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot; disables this message.
[15728.744802] task:touch &#160; &#160; &#160; &#160; &#160; state:D stack: &#160; &#160;0 pid:1011244 ppid:1010843 flags:0x00000084
[15728.746176] Call Trace:
[15728.746643] &#160;__schedule+0x2d1/0x840
[15728.747256] &#160;schedule+0x35/0xa0
[15728.747813] &#160;rwsem_down_write_slowpath+0x30c/0x5c0
[15728.748625] &#160;path_openat+0x34b/0x14f0
[15728.749264] &#160;do_filp_open+0x93/0x100
[15728.749889] &#160;? getname_flags+0x4a/0x1e0
[15728.750551] &#160;? __check_object_size+0xac/0x173
[15728.751295] &#160;do_sys_open+0x188/0x220
[15728.751916] &#160;do_syscall_64+0x5b/0x1b0
[15728.752556] &#160;entry_SYSCALL_64_after_hwframe+0x61/0xc6
[15728.753405] RIP: 0033:0x7f460cf5e272
[15728.754051] Code: Unable to access opcode bytes at RIP 0x7f460cf5e248.
[15728.755123] RSP: 002b:00007ffd1250d590 EFLAGS: 00000246 ORIG_RAX: 0000000000000101
[15728.756352] RAX: ffffffffffffffda RBX: 00000000ffffffff RCX: 00007f460cf5e272
[15728.757513] RDX: 0000000000000941 RSI: 00007ffd1250e40d RDI: 00000000ffffff9c
[15728.758670] RBP: 0000000000000000 R08: 0000000000000000 R09: 0000000000000001
[15728.759833] R10: 00000000000001b6 R11: 0000000000000246 R12: 0000000000000001
[15728.760992] R13: 0000000000000001 R14: 00007ffd1250e40d R15: 00007f460d1fd374
[15767.588855] LustreError: 166-1: MGC10.240.25.241@tcp: Connection to MGS (at 10.240.25.241@tcp) was lost; in progress operations using this service will fail
[15767.591087] LustreError: Skipped 5 previous similar messages
[15784.933984] Lustre: Evicted from MGS (at 10.240.25.241@tcp) after server handle changed from 0x7461a63767ab7b63 to 0x7461a63767ab8ac8
[15784.935919] Lustre: Skipped 3 previous similar messages
[15784.937420] Lustre: MGC10.240.25.241@tcp: Connection restored to 10.240.25.241@tcp (at 10.240.25.241@tcp)
[15784.938977] Lustre: Skipped 14 previous similar messages
[15792.511591] Lustre: DEBUG MARKER: PATH=/usr/lib64/lustre/tests:/usr/lib/lustre/tests:/usr/lib64/lustre/tests:/opt/iozone/bin:/opt/iozone/bin:/opt/iozone/bin:/usr/lib64/lustre/tests/mpi:/usr/lib64/lustre/tests/racer:/usr/lib64/lustre/../lustre-iokit/sgpdd-survey:/usr/lib64/lustre/tests:/us
[15795.354174] Lustre: DEBUG MARKER: /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
[15795.750211] Lustre: DEBUG MARKER: /usr/sbin/lctl mark onyx-70vm7.onyx.whamcloud.com: executing wait_import_state_mount \(FULL\|IDLE\) mdc.lustre-MDT0000-mdc-*.mds_server_uuid
[15796.139101] Lustre: DEBUG MARKER: onyx-70vm7.onyx.whamcloud.com: executing wait_import_state_mount (FULL|IDLE) mdc.lustre-MDT0000-mdc-*.mds_server_uuid
[15796.227757] Lustre: DEBUG MARKER: lctl get_param -n at_max
[15796.603890] Lustre: DEBUG MARKER: /usr/sbin/lctl mark mdc.lustre-MDT0000-mdc-*.mds_server_uuid in FULL state after 0 sec
[15797.004999] Lustre: DEBUG MARKER: mdc.lustre-MDT0000-mdc-*.mds_server_uuid in FULL state after 0 sec
[15798.902782] Lustre: DEBUG MARKER: /usr/sbin/lctl mark &#160;recovery-small test_144a: @@@@@@ FAIL: MDT failover took 252 seconds&#160;
[15799.270104] Lustre: DEBUG MARKER: recovery-small test_144a: @@@@@@ FAIL: MDT failover took 252 seconds
[15799.693930] Lustre: DEBUG MARKER: /usr/sbin/lctl dk &amp;gt; /autotest/autotest-1/2022-12-11/lustre-b2_15_full-part-1_44_61_9513f440-0dd9-4552-b71e-4aba705566d8//recovery-small.test_144a.debug_log.$(hostname -s).1670834021.log;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160;dmesg &amp;gt; /autotest/autotest-1/2022-12-11/lustre-b2_15_full-part-1_4&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
recovery-small test_144a - MDT failover took 252 seconds&lt;/p&gt;</description>
                <environment></environment>
        <key id="73723">LU-16425</key>
            <summary>Interop recovery-small test_144a: MDT failover took 252 seconds</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="sarah">Sarah Liu</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Thu, 22 Dec 2022 01:31:54 +0000</created>
                <updated>Thu, 8 Feb 2024 07:32:39 +0000</updated>
                            <resolved>Thu, 8 Feb 2024 07:32:39 +0000</resolved>
                                    <version>Lustre 2.15.2</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="357261" author="adilger" created="Thu, 22 Dec 2022 18:21:21 +0000"  >&lt;p&gt;The recovery-small test_144a was added in patch &lt;a href=&quot;https://review.whamcloud.com/47006&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/47006&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15724&quot; title=&quot;MDT failover hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15724&quot;&gt;&lt;del&gt;LU-15724&lt;/del&gt;&lt;/a&gt; tests: MDT failover hang reproducer&lt;/tt&gt;&quot; (commit &lt;tt&gt;v2_15_1-36-g9d1805c8b&lt;/tt&gt;) and should be skipped for MDS version 2.15.1 and older.&lt;/p&gt;</comment>
                            <comment id="359541" author="gerrit" created="Wed, 18 Jan 2023 19:26:06 +0000"  >&lt;p&gt;&quot;Sarah Liu &amp;lt;sarah@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49680&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49680&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16425&quot; title=&quot;Interop recovery-small test_144a: MDT failover took 252 seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16425&quot;&gt;&lt;del&gt;LU-16425&lt;/del&gt;&lt;/a&gt; tests: skip recovery-small test_144a in interop&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 805fc370158d677b8526c2292b33cff65a5a2bef&lt;/p&gt;</comment>
                            <comment id="359595" author="adilger" created="Thu, 19 Jan 2023 01:11:52 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49679&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49679&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16425&quot; title=&quot;Interop recovery-small test_144a: MDT failover took 252 seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16425&quot;&gt;&lt;del&gt;LU-16425&lt;/del&gt;&lt;/a&gt; tests: skip interop recovery-small/144a/144b&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 8fc6f1e316e08a8d3172021528189002de7b26c4&lt;/p&gt;</comment>
                            <comment id="359596" author="adilger" created="Thu, 19 Jan 2023 01:12:51 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49681&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49681&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16425&quot; title=&quot;Interop recovery-small test_144a: MDT failover took 252 seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16425&quot;&gt;&lt;del&gt;LU-16425&lt;/del&gt;&lt;/a&gt; tests: skip interop recovery-small/144a&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 17202a93ca9876017c8fc60f6cf2643f80bc0f58&lt;/p&gt;</comment>
                            <comment id="360985" author="gerrit" created="Tue, 31 Jan 2023 02:35:01 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/49679/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/49679/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16425&quot; title=&quot;Interop recovery-small test_144a: MDT failover took 252 seconds&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16425&quot;&gt;&lt;del&gt;LU-16425&lt;/del&gt;&lt;/a&gt; tests: skip interop recovery-small/144a/144b&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 64faf832a6128cc55c0f3ffa0595d9715d3bdd25&lt;/p&gt;</comment>
                            <comment id="403147" author="adilger" created="Thu, 8 Feb 2024 07:32:21 +0000"  >&lt;p&gt;Please use &quot;Resolved&quot; instead of &quot;Closed&quot; for closing tickets, so that they can still be modified afterward.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="37977">LU-8367</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="69587">LU-15724</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i038jr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>