<?xml version="1.0" encoding="UTF-8"?>
<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:30:20 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>
    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-9904] LNetError: 16885:0:(peer.c:1786:lnet_peer_push_event()) Push Put from unknown 0@&lt;0:0&gt; (source 0@&lt;0:0&gt;)</title>
                <link>https://jira.whamcloud.com/browse/LU-9904</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;New error seen during test on el6.9.   Not seen before.  Seen during lustre_rmmod every time.&lt;/p&gt;

&lt;p&gt;Suspect due to recent landings on master.&lt;/p&gt;</description>
                <environment></environment>
        <key id="47913">LU-9904</key>
            <summary>LNetError: 16885:0:(peer.c:1786:lnet_peer_push_event()) Push Put from unknown 0@&lt;0:0&gt; (source 0@&lt;0:0&gt;)</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ashehata">Amir Shehata</assignee>
                                    <reporter username="bogl">Bob Glossman</reporter>
                        <labels>
                    </labels>
                <created>Tue, 22 Aug 2017 22:19:52 +0000</created>
                <updated>Sat, 30 Sep 2017 06:53:25 +0000</updated>
                            <resolved>Sat, 30 Sep 2017 04:48:21 +0000</resolved>
                                                    <fixVersion>Lustre 2.11.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="206079" author="ashehata" created="Tue, 22 Aug 2017 22:22:08 +0000"  >&lt;p&gt;I&apos;ll investigate.&lt;/p&gt;</comment>
                            <comment id="206253" author="ashehata" created="Thu, 24 Aug 2017 14:40:25 +0000"  >&lt;p&gt;This could occur when there is a shutdown. Basically, there is a new mechanism now where events are pushed to the peers whenever there is a local network interface change. During shutdown, everything is being removed, so that&apos;s detected as a change, and some pushes might make it out. When an event is received for that push message, the peer is looked up, but because of the shutdown it would&apos;ve been removed, and that error is printed out. We can probably suppress this error when LNet is shutting down. There are no other negative consequences indicated by this message.&lt;/p&gt;</comment>
                            <comment id="206255" author="bogl" created="Thu, 24 Aug 2017 14:44:36 +0000"  >&lt;p&gt;Your explanation sounds quite plausible.  I think it would be a very good idea to suppress such errors during shutdown.  As it is it looks quite alarming and happens at least once on every shutdown, at least for me.&lt;/p&gt;</comment>
                            <comment id="206263" author="ashehata" created="Thu, 24 Aug 2017 15:15:25 +0000"  >&lt;p&gt;sure. I&apos;ll push in a patch.&lt;/p&gt;</comment>
                            <comment id="206371" author="ashehata" created="Fri, 25 Aug 2017 00:52:31 +0000"  >&lt;p&gt;found a set of steps to reproduce without shutdown:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;peer 2:
modprobe lnet
lnetctl lnet configure
lnetctl net add --net tcp --&lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; eth0,eth1

peer1
modprobe lnet
lnetctl lnet configure
lnetctl net add --net tcp --&lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; eth0,eth1
lnetctl discover 192.168.122.30@tcp # discover peer2
# in /&lt;span class=&quot;code-keyword&quot;&gt;var&lt;/span&gt;/log/messages
# Aug 24 17:49:54 MRtest01 kernel: LNetError: 3447:0:(peer.c:1786:lnet_peer_push_event()) Push Put from unknown 0@&amp;lt;0:0&amp;gt; (source 0@&amp;lt;0:0&amp;gt;)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="208475" author="adilger" created="Fri, 15 Sep 2017 05:31:03 +0000"  >&lt;p&gt;I&apos;ve started hitting this after a recent update as well.  We definitely shouldn&apos;t be printing &quot;Error&quot; on the console for something that happens during normal operation.  I&apos;m also seeing a new error during mount:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# sh sanity.sh
client: executing check_logdir /tmp/test_logs/1505452045
client: ../libcfs/libcfs/libcfs options: &apos;libcfs_panic_on_lbug=0&apos;
Logging to shared log directory: /tmp/test_logs/1505452045
client: executing yml_node
IOC_LIBCFS_GET_NI error 22: Invalid argument
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;The mount itself continues fine, but as with the other error, we shouldn&apos;t be printing errors to the console/terminal during normal operations, as that tends to confuse users.&lt;/p&gt;</comment>
                            <comment id="208547" author="gerrit" created="Fri, 15 Sep 2017 23:55:09 +0000"  >&lt;p&gt;Amir Shehata (amir.shehata@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/29026&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/29026&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9904&quot; title=&quot;LNetError: 16885:0:(peer.c:1786:lnet_peer_push_event()) Push Put from unknown 0@&amp;lt;0:0&amp;gt; (source 0@&amp;lt;0:0&amp;gt;)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9904&quot;&gt;&lt;del&gt;LU-9904&lt;/del&gt;&lt;/a&gt; lnet: reduce logging severity&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 0732d936aa07e8ee129829e738b82f10189cd7ce&lt;/p&gt;</comment>
                            <comment id="208548" author="ashehata" created="Fri, 15 Sep 2017 23:58:32 +0000"  >&lt;p&gt;Andreas, the reason for &lt;br/&gt;
IOC_LIBCFS_GET_NI error 22: Invalid argument&lt;br/&gt;
is because an lctl list_nids is being called before the modules are loaded&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;testvm.centos7: executing check_logdir /tmp/test_logs/1505518717
Logging to shared log directory: /tmp/test_logs/1505518717
testvm.centos7: executing yml_node
IOC_LIBCFS_GET_NI error 22: Invalid argument &amp;lt;----- call to lctl list_nids
Client: Lustre version: 2.10.52_98_g8e75219_dirty
MDS: Lustre version: 2.10.52_98_g8e75219_dirty
OSS: Lustre version: 2.10.52_98_g8e75219_dirty
Stopping clients: testvm.centos7 /mnt/lustre (opts:)
Stopping clients: testvm.centos7 /mnt/lustre2 (opts:)
Loading modules from /usr/lib64/lustre &amp;lt;--- modules (including lnet) are loaded
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="208572" author="adilger" created="Sat, 16 Sep 2017 10:37:06 +0000"  >&lt;p&gt;I would suggest that &lt;tt&gt;IOC_LIBCFS_GET_NI error 22: Invalid argument&lt;/tt&gt; is not a useful error to print if &lt;tt&gt;lctl list_nids&lt;/tt&gt; failed, so that should be fixed up somehow.&lt;/p&gt;

&lt;p&gt;Secondly, I don&apos;t see where &lt;tt&gt;lctl list_nids&lt;/tt&gt; is being called, or I&apos;d suggest to avoid calling it if that doesn&apos;t make sense.  The only places I see it are in &lt;tt&gt;sk_nodemap_setup()&lt;/tt&gt;, which is only called if &lt;tt&gt;$SK_S2S&lt;/tt&gt; is set, and in &lt;tt&gt;host_nids_address()&lt;/tt&gt; which is only &lt;tt&gt;sanity.sh::test_217&lt;/tt&gt; and not during mount that I can see.&lt;/p&gt;</comment>
                            <comment id="208707" author="ashehata" created="Mon, 18 Sep 2017 23:45:10 +0000"  >&lt;p&gt;yaml.sh:yml_node_info() gets called before the modules are loaded. In this function:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; nw in $(lctl list_nids | grep -v @lo | cut -f 2 -d &lt;span class=&quot;code-quote&quot;&gt;&apos;@&apos;&lt;/span&gt; | uniq); &lt;span class=&quot;code-keyword&quot;&gt;do&lt;/span&gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This doesn&apos;t look like it&apos;s something new. I&apos;m not sure exactly how the test framework works to make a change there.&lt;/p&gt;

&lt;p&gt;I would rather not remove the error when list_nids fails, because it&apos;s useful for debugging: it prints out why it failed. I think it makes more sense not to call lctl list_nids from the test unless the modules are loaded first.&lt;/p&gt;</comment>
                            <comment id="209149" author="adilger" created="Thu, 21 Sep 2017 22:55:31 +0000"  >&lt;p&gt;I&apos;d be happy if you fixed the test script to not call &lt;tt&gt;list_nids&lt;/tt&gt; before the modules are loaded.&lt;/p&gt;

&lt;p&gt;Even so, the error message itself doesn&apos;t explain anything to the user who runs &quot;&lt;tt&gt;lctl list_nids&lt;/tt&gt;&quot;.  I&apos;m not suggesting the error should be removed, but rather that it should be improved to be actually useful to the user:&lt;/p&gt;
&lt;ul class=&quot;alternate&quot; type=&quot;square&quot;&gt;
	&lt;li&gt;include &lt;tt&gt;lctl list_nids:&lt;/tt&gt; at the start, so the reader knows which command is failing&lt;/li&gt;
	&lt;li&gt;expand the message for EINVAL to suggest that the lnet module is not loaded&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="210020" author="gerrit" created="Sat, 30 Sep 2017 04:41:25 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/29026/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/29026/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9904&quot; title=&quot;LNetError: 16885:0:(peer.c:1786:lnet_peer_push_event()) Push Put from unknown 0@&amp;lt;0:0&amp;gt; (source 0@&amp;lt;0:0&amp;gt;)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9904&quot;&gt;&lt;del&gt;LU-9904&lt;/del&gt;&lt;/a&gt; lnet: reduce logging severity&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 7fc8037d61b29fa2ac93ab5fb30fccd9b1c0066c&lt;/p&gt;</comment>
                            <comment id="210028" author="pjones" created="Sat, 30 Sep 2017 04:48:21 +0000"  >&lt;p&gt;Landed for 2.11.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="45981">LU-9480</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzziuf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>