<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:07:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14207] Replace_nids left old nids in add_conn field of failnid section of client llog</title>
                <link>https://jira.whamcloud.com/browse/LU-14207</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;OST doesn&apos;t start after replace_nids&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
00000020:01000004:19.0:1602101845.630802:0:58310:0:(obd_mount.c:193:lustre_start_simple()) Starting obd cslmo7fs-MDT0000-lwp-OST0001 (typ=lwp)
00000020:00000080:19.0:1602101845.630804:0:58310:0:(obd_config.c:1128:class_process_config()) processing cmd: cf001
00000020:00000080:19.0:1602101845.630811:0:58310:0:(genops.c:451:class_newdev()) Allocate &lt;span class=&quot;code-keyword&quot;&gt;new&lt;/span&gt; device cslmo7fs-MDT0000-lwp-OST0001 (ffff9a88fc608000)
00000020:00000080:19.0:1602101845.630854:0:58310:0:(obd_config.c:431:class_attach()) OBD: dev 4 attached type lwp with refcount 1
00000020:00000080:19.0:1602101845.630855:0:58310:0:(obd_config.c:1128:class_process_config()) processing cmd: cf003
00010000:00080000:19.0:1602101845.630919:0:58310:0:(ldlm_lib.c:115:import_set_conn()) imp ffff9a88fc610000@cslmo7fs-MDT0000-lwp-OST0001: add connection 172.17.8.53@o2ib at head
00000020:00000080:19.0:1602101845.631562:0:58310:0:(obd_config.c:538:class_setup()) finished setup of obd cslmo7fs-MDT0000-lwp-OST0001 (uuid cslmo7fs-MDT0000-lwp-OST0001_UUID)
00000010:01000000:19.0:1602101845.631571:0:58310:0:(lwp_dev.c:504:lwp_obd_connect()) connect #0
00000020:00000080:19.0:1602101845.631575:0:58310:0:(genops.c:1421:class_connect()) connect: client cslmo7fs-MDT0000-lwp-OST0001, cookie 0xf1eaeee46a1899ae
00000100:00080000:19.0:1602101845.631579:0:58310:0:(&lt;span class=&quot;code-keyword&quot;&gt;import&lt;/span&gt;.c:543:import_select_connection()) cslmo7fs-MDT0000-lwp-OST0001: connect to NID 172.17.8.53@o2ib last attempt 0
00000100:00080000:19.0:1602101845.631581:0:58310:0:(&lt;span class=&quot;code-keyword&quot;&gt;import&lt;/span&gt;.c:619:import_select_connection()) cslmo7fs-MDT0000-lwp-OST0001: &lt;span class=&quot;code-keyword&quot;&gt;import&lt;/span&gt; ffff9a88fc610000 using connection 172.17.8.53@o2ib/172.17.8.53@o2ib
00000100:00080000:19.0:1602101845.631595:0:58310:0:(pinger.c:376:ptlrpc_pinger_add_import()) adding pingable &lt;span class=&quot;code-keyword&quot;&gt;import&lt;/span&gt; cslmo7fs-MDT0000-lwp-OST0001_UUID-&amp;gt;cslmo7fs-MDT0000_UUID
00010000:00080000:19.0:1602101845.631661:0:58310:0:(ldlm_lib.c:115:import_set_conn()) imp ffff9a88fc610000@cslmo7fs-MDT0000-lwp-OST0001: add connection 172.17.8.52@o2ib at tail
00000100:00000100:19.0:1602101845.631669:0:58310:0:(client.c:97:ptlrpc_uuid_to_connection()) cannot find peer 172.17.7.52@o2ib!
00000100:00080000:11.0F:1602101845.631670:0:58313:0:(client.c:1631:ptlrpc_send_new_req()) @@@ req waiting &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; recovery: (FULL != CONNECTING)  req@ffff9a8e57656300 x1679925143670144/t0(0) o901-&amp;gt;cslmo7fs-MDT0000-lwp-OST0001@172.17.8.53@o2ib:29/10 lens 248/4320 e 0 to 0 dl 0 ref 2 fl Rpc:W/0/ffffffff rc 0/-1 job:&apos;&apos;
00010000:00080000:19.0:1602101845.641922:0:58310:0:(ldlm_lib.c:77:import_set_conn()) can&apos;t find connection 172.17.7.52@o2ib
00000020:00020000:19.0:1602101845.641924:0:58310:0:(obd_mount_server.c:769:lustre_lwp_add_conn()) cslmo7fs-MDT0000-lwp-OST0001: can&apos;t add conn: rc = -2
00000040:00080000:19.0:1602101845.655437:0:58310:0:(llog.c:713:llog_process_thread()) stop processing plain 0x4c:10:0 index 42 count 60
00000020:01000000:7.0:1602101845.655451:0:58201:0:(obd_config.c:1876:class_config_parse_llog()) Processed log cslmo7fs-client gen 1-42 (rc=-2)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;There are old NIDs (172.17.7.x) in the cslmo7fs-client llog; the new ones are 172.17.8.x.&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;

#36 (224)marker  15 (flags=0x01, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:20 2020-
#37 (088)add_uuid  nid=172.17.8.54@o2ib(0x50000ac110836)  0:  1:172.17.8.54@o2ib  
#38 (112)add_conn  0:cslmo7fs-OST0000-osc  1:172.17.7.55@o2ib  
#39 (224)END   marker  15 (flags=0x02, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:20 2020-
#40 (224)marker  18 (flags=0x01, v2.12.4.2) cslmo7fs-MDT0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:23 2020-
#41 (088)add_uuid  nid=172.17.8.53@o2ib(0x50000ac110835)  0:  1:172.17.8.53@o2ib  
#42 (112)add_conn  0:cslmo7fs-MDT0000-mdc  1:172.17.7.52@o2ib  
#43 (224)END   marker  18 (flags=0x02, v2.12.4.2) cslmo7fs-MDT0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:23 2020-
#44 (224)marker  19 (flags=0x01, v2.12.4.2) cslmo7fs-OST0001 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:26 2020-
#45 (088)add_uuid  nid=172.17.8.55@o2ib(0x50000ac110837)  0:  1:172.17.8.55@o2ib  
#46 (112)add_conn  0:cslmo7fs-OST0001-osc  1:172.17.7.54@o2ib  
#47 (224)END   marker  19 (flags=0x02, v2.12.4.2) cslmo7fs-OST0001 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:26 2020-
#48 (224)marker  20 (flags=0x01, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:16:54 2020-
#49 (088)add_uuid  nid=172.17.8.55@o2ib(0x50000ac110837)  0:  1:172.17.8.55@o2ib  
#50 (112)add_conn  0:cslmo7fs-OST0000-osc  1:172.17.8.55@o2ib  
#51 (224)END   marker  20 (flags=0x02, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:16:54 2020-
#53 (224)marker  23 (flags=0x01, v2.12.4.2) cslmo7fs-MDT0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:16:54 2020-
#54 (088)add_uuid  nid=172.17.8.52@o2ib(0x50000ac110834)  0:  1:172.17.8.52@o2ib  
#55 (112)add_conn  0:cslmo7fs-MDT0000-mdc  1:172.17.8.52@o2ib  
#56 (224)END   marker  23 (flags=0x02, v2.12.4.2) cslmo7fs-MDT0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:16:54 2020-
#57 (224)marker  24 (flags=0x01, v2.12.4.2) cslmo7fs-OST0001 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:17:14 2020-
#58 (088)add_uuid  nid=172.17.8.54@o2ib(0x50000ac110836)  0:  1:172.17.8.54@o2ib  
#59 (112)add_conn  0:cslmo7fs-OST0001-osc  1:172.17.8.54@o2ib  
#60 (224)END   marker  24 (flags=0x02, v2.12.4.2) cslmo7fs-OST0001 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:17:14 2020-
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Commands like &quot;--erase-param failover.node --param failover.node=172.17.5.52@o2ib&quot; add sections to the llog files.&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
#36 (224)marker  15 (flags=0x01, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:20 2020-
#37 (088)add_uuid  nid=172.17.8.54@o2ib(0x50000ac110836)  0:  1:172.17.8.54@o2ib  
#38 (112)add_conn  0:cslmo7fs-OST0000-osc  1:172.17.7.55@o2ib  
#39 (224)END   marker  15 (flags=0x02, v2.12.4.2) cslmo7fs-OST0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:20 2020-
#40 (224)marker  18 (flags=0x01, v2.12.4.2) cslmo7fs-MDT0000 &lt;span class=&quot;code-quote&quot;&gt;&apos;add failnid&apos;&lt;/span&gt; Wed Oct  7 20:04:23 2020-
lctl replace_nids processes the &lt;span class=&quot;code-quote&quot;&gt;&quot;add failnid&quot;&lt;/span&gt; section incorrectly: it changes &lt;span class=&quot;code-quote&quot;&gt;&quot;add_uuid&quot;&lt;/span&gt; but leaves add_conn as is.
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This should be fixed in replace_nids code.&lt;/p&gt;

&lt;p&gt;As a workaround, I suggest excluding the &quot;--erase-param failover.node --param failover.node=172.17.5.52@o2ib&quot; parameters from scripts. They are duplicated by a replace_nids command like:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
lctl replace_nids cslmo7fs-OST0001 172.17.4.56@o2ib:172.17.4.54@o2ib
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The failover NID is placed after &quot;:&quot; here.&lt;/p&gt;</description>
                <environment></environment>
        <key id="61940">LU-14207</key>
            <summary>Replace_nids left old nids in add_conn field of failnid section of client llog</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="artem_blagodarenko">Artem Blagodarenko</assignee>
                                    <reporter username="artem_blagodarenko">Artem Blagodarenko</reporter>
                        <labels>
                            <label>patch</label>
                    </labels>
                <created>Thu, 10 Dec 2020 08:52:34 +0000</created>
                <updated>Fri, 26 Feb 2021 21:14:09 +0000</updated>
                            <resolved>Fri, 26 Feb 2021 21:14:09 +0000</resolved>
                                                    <fixVersion>Lustre 2.15.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="287183" author="gerrit" created="Thu, 10 Dec 2020 09:10:42 +0000"  >&lt;p&gt;Artem Blagodarenko (artem.blagodarenko@hpe.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/40930&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/40930&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14207&quot; title=&quot;Replace_nids left old nids in add_conn field of failnid section of client llog&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14207&quot;&gt;&lt;del&gt;LU-14207&lt;/del&gt;&lt;/a&gt; mgs: delete &quot;add failnid&quot; sections on replace_nids&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: fa782a0ad3c32a6b3b3ab717255a508eab9fd84f&lt;/p&gt;</comment>
                            <comment id="293240" author="gerrit" created="Fri, 26 Feb 2021 20:13:26 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/40930/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/40930/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14207&quot; title=&quot;Replace_nids left old nids in add_conn field of failnid section of client llog&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14207&quot;&gt;&lt;del&gt;LU-14207&lt;/del&gt;&lt;/a&gt; mgs: delete &quot;add failnid&quot; sections on replace_nids&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 8910291fc5ca71588e865ac2ec3a7fbb881a7082&lt;/p&gt;</comment>
                            <comment id="293282" author="pjones" created="Fri, 26 Feb 2021 21:14:09 +0000"  >&lt;p&gt;Landed for 2.15&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01guf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>