<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:53:04 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-12493] Bug when importing peer yaml; Panic/hang on cleanup afterwards</title>
                <link>https://jira.whamcloud.com/browse/LU-12493</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;When importing peer yaml, I see errors that I don&apos;t understand.&lt;/p&gt;

&lt;p&gt;here&apos;s the test:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;sles15build01:~ # bash -x /bin/clean.sh
+ LUSTRE=/home/hornc/lustre-filesystem
+ LNETCTL=/home/hornc/lustre-filesystem/lnet/utils/lnetctl
+ /home/hornc/lustre-filesystem/lnet/utils/lnetctl lnet unconfigure
opening /dev/lnet failed: No such file or directory
hint: the kernel modules may not be loaded
unconfigure:
    - lnet:
          errno: -2
          descr: &quot;LNet unconfigure error: No such file or directory&quot;
+ rmmod /home/hornc/lustre-filesystem/lnet/klnds/socklnd/ksocklnd.ko
rmmod: ERROR: Module ksocklnd is not currently loaded
+ rmmod /home/hornc/lustre-filesystem/lnet/lnet/lnet.ko
rmmod: ERROR: Module lnet is not currently loaded
+ rmmod /home/hornc/lustre-filesystem/libcfs/libcfs/libcfs.ko
rmmod: ERROR: Module libcfs is not currently loaded
sles15build01:~ # bash -x /bin/start.sh
+ LUSTRE=/home/hornc/lustre-filesystem
+ LNETCTL=/home/hornc/lustre-filesystem/lnet/utils/lnetctl
+ insmod /home/hornc/lustre-filesystem/libcfs/libcfs/libcfs.ko
+ insmod /home/hornc/lustre-filesystem/lnet/lnet/lnet.ko
+ insmod /home/hornc/lustre-filesystem/lnet/klnds/socklnd/ksocklnd.ko
+ /home/hornc/lustre-filesystem/lnet/utils/lnetctl lnet configure
sles15build01:~ # cat /tmp/t.txt
peer:
    - primary nid: 1.1.1.1@o2ib
      Multi-Rail: False
      peer ni:
        - nid: 1.1.1.1@o2ib
        - nid: 2.2.2.2@tcp
        - nid: 3.3.3.3@tcp
        - nid: 4.4.4.4@o2ib
        - nid: 5.5.5.5@o2ib
        - nid: 6.6.6.6@tcp
        - nid: 7.7.7.7@tcp
        - nid: 8.8.8.8@o2ib
    - primary nid: 9.9.9.9@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 9.9.9.9@o2ib
        - nid: 10.10.10.10@o2ib
        - nid: 11.11.11.11@o2ib
        - nid: 12.12.12.12@o2ib
        - nid: 13.13.13.13@tcp
        - nid: 14.14.14.14@o2ib
        - nid: 15.15.15.15@tcp
        - nid: 16.16.16.16@o2ib
    - primary nid: 17.17.17.17@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 17.17.17.17@o2ib
        - nid: 18.18.18.18@o2ib
        - nid: 19.19.19.19@o2ib
        - nid: 20.20.20.20@tcp
        - nid: 21.21.21.21@o2ib
        - nid: 22.22.22.22@o2ib
        - nid: 23.23.23.23@tcp
        - nid: 24.24.24.24@o2ib
    - primary nid: 25.25.25.25@tcp
      Multi-Rail: False
      peer ni:
        - nid: 25.25.25.25@tcp
        - nid: 26.26.26.26@o2ib
        - nid: 27.27.27.27@o2ib
        - nid: 28.28.28.28@tcp
        - nid: 29.29.29.29@o2ib
        - nid: 30.30.30.30@tcp
        - nid: 31.31.31.31@o2ib
        - nid: 32.32.32.32@tcp
    - primary nid: 33.33.33.33@tcp
      Multi-Rail: False
      peer ni:
        - nid: 33.33.33.33@tcp
        - nid: 34.34.34.34@o2ib
        - nid: 35.35.35.35@tcp
        - nid: 36.36.36.36@o2ib
        - nid: 37.37.37.37@o2ib
        - nid: 38.38.38.38@tcp
        - nid: 39.39.39.39@o2ib
        - nid: 40.40.40.40@o2ib
sles15build01:~ # /home/hornc/lustre-filesystem/lnet/utils/lnetctl import &amp;lt; /tmp/t.txt
add:
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
    - peer_ni:
          errno: 0
          descr: &quot;Success&quot;
    - peer_ni:
          errno: 0
          descr: &quot;Success&quot;
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
sles15build01:~ #
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Every nid in the file is unique.&lt;/p&gt;

&lt;p&gt;Trying to clean up after doing the above, the node either hangs or crashes:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;sles15build01:~ # bash -x /bin/clean.sh
+ LUSTRE=/home/hornc/lustre-filesystem
+ LNETCTL=/home/hornc/lustre-filesystem/lnet/utils/lnetctl
+ /home/hornc/lustre-filesystem/lnet/utils/lnetctl lnet unconfigure
^^Hangs
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I haven&apos;t been able to get a crash dump.&lt;/p&gt;

&lt;p&gt;Seen with 2.13 but I&apos;d bet money it affects 2.10+&lt;/p&gt;</description>
                <environment></environment>
        <key id="56230">LU-12493</key>
            <summary>Bug when importing peer yaml; Panic/hang on cleanup afterwards</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="hornc">Chris Horn</reporter>
                        <labels>
                    </labels>
                <created>Sat, 29 Jun 2019 18:59:41 +0000</created>
                <updated>Sat, 29 Jun 2019 19:29:50 +0000</updated>
                                            <version>Lustre 2.13.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>1</watches>
                                                                            <comments>
                            <comment id="250370" author="hornc" created="Sat, 29 Jun 2019 19:26:35 +0000"  >&lt;p&gt;Ah, we&apos;re hitting this code:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;        /*
         * Get the peer_net. Check that we&apos;re not adding a second
         * peer_ni on a peer_net of a non-multi-rail peer.
         */
        lpn = lnet_peer_get_net_locked(lp, LNET_NIDNET(nid));
        if (!lpn) {
                lpn = lnet_peer_net_alloc(LNET_NIDNET(nid));
                if (!lpn) {
                        rc = -ENOMEM;
                        goto out_free_lpni;
                }
        } else if (!(lp-&amp;gt;lp_state &amp;amp; LNET_PEER_MULTI_RAIL)) {
                rc = -ENOTUNIQ;
                goto out_free_lpni;
        }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Would be nice to have a better error message. Still not sure why we&apos;re hanging/crashing on cleanup.&lt;/p&gt;</comment>
                            <comment id="250371" author="hornc" created="Sat, 29 Jun 2019 19:29:04 +0000"  >&lt;p&gt;So if we&apos;re supposed to be prevented from adding secondary nids to non-MR peers then that doesn&apos;t seem to be working correctly:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;sles15build01:/home/hornc/lustre-filesystem/lustre/tests # cat /tmp/t.txt
peer:
    - primary nid: 1.1.1.1@o2ib
      Multi-Rail: False
      peer ni:
        - nid: 1.1.1.1@o2ib
        - nid: 2.2.2.2@tcp
        - nid: 3.3.3.3@tcp
        - nid: 4.4.4.4@o2ib
        - nid: 5.5.5.5@o2ib
        - nid: 6.6.6.6@tcp
        - nid: 7.7.7.7@tcp
        - nid: 8.8.8.8@o2ib
    - primary nid: 9.9.9.9@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 9.9.9.9@o2ib
        - nid: 10.10.10.10@o2ib
        - nid: 11.11.11.11@o2ib
        - nid: 12.12.12.12@o2ib
        - nid: 13.13.13.13@tcp
        - nid: 14.14.14.14@o2ib
        - nid: 15.15.15.15@tcp
        - nid: 16.16.16.16@o2ib
    - primary nid: 17.17.17.17@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 17.17.17.17@o2ib
        - nid: 18.18.18.18@o2ib
        - nid: 19.19.19.19@o2ib
        - nid: 20.20.20.20@tcp
        - nid: 21.21.21.21@o2ib
        - nid: 22.22.22.22@o2ib
        - nid: 23.23.23.23@tcp
        - nid: 24.24.24.24@o2ib
    - primary nid: 25.25.25.25@tcp
      Multi-Rail: False
      peer ni:
        - nid: 25.25.25.25@tcp
        - nid: 26.26.26.26@o2ib
        - nid: 27.27.27.27@o2ib
        - nid: 28.28.28.28@tcp
        - nid: 29.29.29.29@o2ib
        - nid: 30.30.30.30@tcp
        - nid: 31.31.31.31@o2ib
        - nid: 32.32.32.32@tcp
    - primary nid: 33.33.33.33@tcp
      Multi-Rail: False
      peer ni:
        - nid: 33.33.33.33@tcp
        - nid: 34.34.34.34@o2ib
        - nid: 35.35.35.35@tcp
        - nid: 36.36.36.36@o2ib
        - nid: 37.37.37.37@o2ib
        - nid: 38.38.38.38@tcp
        - nid: 39.39.39.39@o2ib
        - nid: 40.40.40.40@o2ib
sles15build01:/home/hornc/lustre-filesystem/lustre/tests # lnetctl import &amp;lt; /tmp/t.txt
add:
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
    - peer_ni:
          errno: 0
          descr: &quot;Success&quot;
    - peer_ni:
          errno: 0
          descr: &quot;Success&quot;
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
    - peer_ni:
          errno: -76
          descr: &quot;cannot add peer ni: Name not unique on network&quot;
sles15build01:/home/hornc/lustre-filesystem/lustre/tests # lnetctl peer show
peer:
    - primary nid: 25.25.25.25@tcp
      Multi-Rail: False
      peer ni:
        - nid: 25.25.25.25@tcp
          state: NA
        - nid: 26.26.26.26@o2ib
          state: NA
    - primary nid: 9.9.9.9@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 9.9.9.9@o2ib
          state: NA
        - nid: 10.10.10.10@o2ib
          state: NA
        - nid: 11.11.11.11@o2ib
          state: NA
        - nid: 12.12.12.12@o2ib
          state: NA
        - nid: 14.14.14.14@o2ib
          state: NA
        - nid: 16.16.16.16@o2ib
          state: NA
        - nid: 13.13.13.13@tcp
          state: NA
        - nid: 15.15.15.15@tcp
          state: NA
    - primary nid: 1.1.1.1@o2ib
      Multi-Rail: False
      peer ni:
        - nid: 1.1.1.1@o2ib
          state: NA
        - nid: 2.2.2.2@tcp
          state: NA
    - primary nid: 17.17.17.17@o2ib
      Multi-Rail: True
      peer ni:
        - nid: 17.17.17.17@o2ib
          state: NA
        - nid: 18.18.18.18@o2ib
          state: NA
        - nid: 19.19.19.19@o2ib
          state: NA
        - nid: 21.21.21.21@o2ib
          state: NA
        - nid: 22.22.22.22@o2ib
          state: NA
        - nid: 24.24.24.24@o2ib
          state: NA
        - nid: 20.20.20.20@tcp
          state: NA
        - nid: 23.23.23.23@tcp
          state: NA
    - primary nid: 33.33.33.33@tcp
      Multi-Rail: False
      peer ni:
        - nid: 33.33.33.33@tcp
          state: NA
        - nid: 34.34.34.34@o2ib
          state: NA
sles15build01:/home/hornc/lustre-filesystem/lustre/tests #
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00iyf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>