<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:58:59 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-6296] insanity test_1: check_for_recovery_ready()) ASSERTION( clnts &lt;= obd-&gt;obd_max_recoverable_clients )</title>
                <link>https://jira.whamcloud.com/browse/LU-6296</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for wangdi &amp;lt;di.wang@intel.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/4636a65e-bd3a-11e4-8d85-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/4636a65e-bd3a-11e4-8d85-5254006e85c2&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_1 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;test failed to respond and timed out
19:56:07:Lustre: Evicted from MGS (at 10.1.6.12@tcp) after server handle changed from 0xbe3c45f237bd6bdf to 0xbe3c45f237bd760b
19:56:07:LustreError: 19415:0:(ldlm_lib.c:1963:check_for_recovery_ready()) ASSERTION( clnts &amp;lt;= obd-&amp;gt;obd_max_recoverable_clients ) failed: 
19:56:07:LustreError: 19415:0:(ldlm_lib.c:1963:check_for_recovery_ready()) LBUG
19:56:07:Pid: 19415, comm: tgt_recov
19:56:07:
19:56:07:Call Trace:
19:56:07: [&amp;lt;ffffffffa0491895&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
19:56:07: [&amp;lt;ffffffffa0491e97&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
19:56:07: [&amp;lt;ffffffffa07cf9de&amp;gt;] check_for_recovery_ready+0x17e/0x180 [ptlrpc]
19:56:07: [&amp;lt;ffffffffa07cf860&amp;gt;] ? check_for_recovery_ready+0x0/0x180 [ptlrpc]
19:56:07: [&amp;lt;ffffffffa07d0f16&amp;gt;] target_recovery_overseer+0xd6/0x320 [ptlrpc]
19:56:07: [&amp;lt;ffffffffa07cf4b0&amp;gt;] ? exp_connect_healthy+0x0/0x20 [ptlrpc]
19:56:07: [&amp;lt;ffffffff8109eb00&amp;gt;] ? autoremove_wake_function+0x0/0x40
19:56:07: [&amp;lt;ffffffffa07d8274&amp;gt;] target_recovery_thread+0x5b4/0x1ad0 [ptlrpc]
19:56:07: [&amp;lt;ffffffff81064ba2&amp;gt;] ? default_wake_function+0x12/0x20
19:56:07: [&amp;lt;ffffffffa07d7cc0&amp;gt;] ? target_recovery_thread+0x0/0x1ad0 [ptlrpc]
19:56:07: [&amp;lt;ffffffff8109e66e&amp;gt;] kthread+0x9e/0xc0
19:56:07: [&amp;lt;ffffffff8100c20a&amp;gt;] child_rip+0xa/0x20
19:56:07: [&amp;lt;ffffffff8109e5d0&amp;gt;] ? kthread+0x0/0xc0
19:56:07: [&amp;lt;ffffffff8100c200&amp;gt;] ? child_rip+0x0/0x20
19:56:07:
19:56:07:Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Please provide additional information about the failure here.&lt;/p&gt;

&lt;p&gt;Info required for matching: insanity 1&lt;/p&gt;</description>
                <environment></environment>
        <key id="28862">LU-6296</key>
            <summary>insanity test_1: check_for_recovery_ready()) ASSERTION( clnts &lt;= obd-&gt;obd_max_recoverable_clients )</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="di.wang">Di Wang</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                            <label>dne2</label>
                    </labels>
                <created>Thu, 26 Feb 2015 00:29:19 +0000</created>
                <updated>Fri, 9 Sep 2016 20:14:53 +0000</updated>
                            <resolved>Fri, 27 Feb 2015 05:07:04 +0000</resolved>
                                    <version>Lustre 2.8.0</version>
                                    <fixVersion>Lustre 2.8.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="108196" author="di.wang" created="Fri, 27 Feb 2015 05:03:16 +0000"  >&lt;p&gt;It seems obd_max_recoverable_clients should be updated when new MDS-MDS exports are created. This patch should fix the problem&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;diff --git a/lustre/ldlm/ldlm_lib.c b/lustre/ldlm/ldlm_lib.c
index f1b8faf..7388e6c 100644
--- a/lustre/ldlm/ldlm_lib.c
+++ b/lustre/ldlm/ldlm_lib.c
@@ -1172,8 +1172,7 @@ dont_check_exports:
                              &amp;amp;export-&amp;gt;exp_nid_hash);
         }

-       if (target-&amp;gt;obd_recovering &amp;amp;&amp;amp; !export-&amp;gt;exp_in_recovery &amp;amp;&amp;amp; !lw_client &amp;amp;&amp;amp;
-           !new_mds_mds_conn) {
+       if (target-&amp;gt;obd_recovering &amp;amp;&amp;amp; !export-&amp;gt;exp_in_recovery &amp;amp;&amp;amp; !lw_client) {
                 int has_transno;
                 __u64 transno = data-&amp;gt;ocd_transno;

@@ -1206,6 +1205,14 @@ dont_check_exports:

                atomic_inc(&amp;amp;target-&amp;gt;obd_req_replay_clients);
                atomic_inc(&amp;amp;target-&amp;gt;obd_lock_replay_clients);
+               /* Note: MDS-MDS connection is allowed to be connected during
+                * recovery, no matter if the exports needs to be recoveried.
+                * Because we need retrieve updates logs from all other MDTs.
+                * So if the MDS-MDS export is new, obd_max_recoverable_clients
+                * also needs to be increased to match other recovery checking
+                * condition. */
+               if (new_mds_mds_conn)
+                       target-&amp;gt;obd_max_recoverable_clients++;
                if (atomic_inc_return(&amp;amp;target-&amp;gt;obd_connected_clients) ==
                    target-&amp;gt;obd_max_recoverable_clients)
                        wake_up(&amp;amp;target-&amp;gt;obd_next_transno_waitq);
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="108197" author="di.wang" created="Fri, 27 Feb 2015 05:06:58 +0000"  >&lt;p&gt;I will add this patch to &lt;a href=&quot;http://review.whamcloud.com/#/c/11737/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/11737/&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="19630">LU-3534</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzx75r:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>17630</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>