<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:05:48 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13976] duplicate IB_WR_LOCAL_INV causing ice driver failure (RoCE/iWarp)</title>
                <link>https://jira.whamcloud.com/browse/LU-13976</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;During lnet_selftest read &amp;gt; 4K (write works without this issue), the ice driver detects a duplicate IB_WR_LOCAL_INV on the same key and the test fails. We also cannot mount a file system over Lustre because of this issue.&lt;/p&gt;

&lt;p&gt;We instrumented o2iblnd.c and the irdma driver and found the duplicate IB_WR_LOCAL_INV:&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;In the example below, skl01 is the client and skl02 is the server during a lst read operation.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;b&gt;skl01, irdma trace:&lt;/b&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:11:42 2020&amp;#93;&lt;/span&gt; MKI-irdma_create_stag: returning stag = 0xb16f427b&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:11:42 2020&amp;#93;&lt;/span&gt; LNet: Added LNI &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:192.168.1.1@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;192.168.1.1@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;8/256/0/180&amp;#93;&lt;/span&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x8e89e91b&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x8e89e91c, info.stag_key=0x1c, info.stag_idx=0x8e89e9&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:08 2020&amp;#93;&lt;/span&gt; ice 0000:18:00.0: abnormal ae_id = 0x50a bool qp=1 qp_id = 6&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:08 2020&amp;#93;&lt;/span&gt; LNetError: 4268:0:(o2iblnd_cb.c:3676:kiblnd_qp_event()) &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:192.168.1.2@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;192.168.1.2@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt;: Async QP event type 1&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:08 2020&amp;#93;&lt;/span&gt; LustreError: 47768:0:(brw_test.c:344:brw_client_done_rpc()) BRW RPC to &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:12345-192.168.1.2@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;12345-192.168.1.2@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt; failed with -103&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;b&gt;skl01, Lustre trace:&lt;/b&gt;&lt;/p&gt;
&lt;div class=&apos;table-wrap&apos;&gt;
&lt;table class=&apos;confluenceTable&apos;&gt;&lt;tbody&gt;
&lt;tr&gt;
&lt;td class=&apos;confluenceTd&apos;&gt;00000800:00000200:57.0:1600697647.117610:0:47619:0:(o2iblnd.c:1913:kiblnd_fmr_pool_map()) jpe key 8e89e91b&lt;br/&gt;
00000800:00000200:57.0:1600697647.117611:0:47619:0:(o2iblnd.c:1919:kiblnd_fmr_pool_map()) jpe key after bump 8e89e91c&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;&lt;/table&gt;
&lt;/div&gt;


&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;b&gt;skl02, irdma trace:&lt;/b&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:11:42 2020&amp;#93;&lt;/span&gt; MKI-irdma_create_stag: returning stag = 0x968276e9&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:11:42 2020&amp;#93;&lt;/span&gt; MKI-irdma_create_stag: returning stag = 0xd477355c&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:11:42 2020&amp;#93;&lt;/span&gt; LNet: Added LNI &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:192.168.1.2@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;192.168.1.2@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;8/256/0/180&amp;#93;&lt;/span&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; LNet: 36382:0:(rpc.c:612:srpc_service_add_buffers()) waiting for adding buffer&lt;/p&gt;

&lt;p&gt;&lt;font color=&quot;#FF0000&quot;&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x31172601&lt;/font&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x31172602, info.stag_key=0x2, info.stag_idx=0x311726&lt;/p&gt;

&lt;p&gt;&lt;font color=&quot;#FF0000&quot;&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x31172601&#160; &lt;span class=&quot;error&quot;&gt;&amp;#91;MKI&amp;#93;&lt;/span&gt; This key was already invalidated&lt;/font&gt;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x31172602, info.stag_key=0x2, info.stag_idx=0x311726&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; ice 0000:18:00.0: abnormal ae_id = 0x106 bool qp=1 qp_id = 4&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; LNetError: 36497:0:(o2iblnd_cb.c:3676:kiblnd_qp_event()) &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:192.168.1.1@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;192.168.1.1@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt;: Async QP event type 1&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:07 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x76b95769&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:07 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x76b9576a, info.stag_key=0x6a, info.stag_idx=0x76b957&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:07 2020&amp;#93;&lt;/span&gt; LNet: 36261:0:(o2iblnd_cb.c:413:kiblnd_handle_rx()) PUT_NACK from &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:192.168.1.1@o2ib&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;192.168.1.1@o2ib&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;b&gt;skl02, Lustre trace:&lt;/b&gt;&lt;/p&gt;
&lt;div class=&apos;table-wrap&apos;&gt;
&lt;table class=&apos;confluenceTable&apos;&gt;&lt;tbody&gt;
&lt;tr&gt;
&lt;td class=&apos;confluenceTd&apos;&gt;00000800:00000200:28.0:1600697647.441213:0:36436:0:(o2iblnd.c:1913:kiblnd_fmr_pool_map()) jpe key 31172601&lt;br/&gt;
00000800:00000200:28.0:1600697647.441215:0:36436:0:(o2iblnd.c:1919:kiblnd_fmr_pool_map()) jpe key after bump 31172602&lt;br/&gt;
00000800:00000200:59.0:1600697647.677998:0:36262:0:(o2iblnd.c:1913:kiblnd_fmr_pool_map()) jpe key 76b95769&lt;br/&gt;
00000800:00000200:59.0:1600697647.678000:0:36262:0:(o2iblnd.c:1919:kiblnd_fmr_pool_map()) jpe key after bump 76b9576a&lt;/td&gt;
&lt;/tr&gt;
&lt;/tbody&gt;&lt;/table&gt;
&lt;/div&gt;


&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x31172601&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x31172602, info.stag_key=0x2, info.stag_idx=0x311726&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;The next line below is a duplicate, as rkey = 0x31172601 is already invalidated above. We think this should have been 0x31172602, which would avoid invalidating an already-invalidated key and also avoid doing a duplicate REG_MR on the same key.&lt;/p&gt;

&lt;p&gt;Is there something else doing an invalidate somewhere in the code?&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_LOCAL_INV rkey = 0x31172601&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; MKI-IB_WR_REG_MR: ib_wr-&amp;gt;wr_id=0x4, reg_wr(ib_wr)-&amp;gt;key=0x31172602, info.stag_key=0x2, info.stag_idx=0x311726&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;Mon Sep 21 10:14:06 2020&amp;#93;&lt;/span&gt; ice 0000:18:00.0: abnormal ae_id = 0x106 bool qp=1 qp_id = 4&lt;/p&gt;</description>
                <environment>RHEL 8.1, Intel Corporation Ethernet Controller E810-C, iwarp or RoCE mode</environment>
        <key id="60888">LU-13976</key>
            <summary>duplicate IB_WR_LOCAL_INV causing ice driver failure (RoCE/iWarp)</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="jerwin">James Erwin</reporter>
                        <labels>
                    </labels>
                <created>Tue, 22 Sep 2020 12:57:29 +0000</created>
                <updated>Wed, 23 Mar 2022 12:54:31 +0000</updated>
                            <resolved>Wed, 23 Mar 2022 12:54:31 +0000</resolved>
                                    <version>Lustre 2.12.5</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="283229" author="jerwin" created="Mon, 26 Oct 2020 13:41:30 +0000"  >&lt;p&gt;Hello, is there any update on this issue?&#160;&lt;/p&gt;</comment>
                            <comment id="329655" author="mmarcini2" created="Fri, 18 Mar 2022 21:15:27 +0000"  >&lt;p&gt;I suspect this issue is a duplicate.&lt;/p&gt;</comment>
                            <comment id="329934" author="mmarcini2" created="Wed, 23 Mar 2022 12:14:44 +0000"  >&lt;p&gt;I have confirmed that a client built off of the 2.12.8 branch doesn&apos;t see the issue.&lt;/p&gt;

&lt;p&gt;This is indeed a duplicate.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="64515">LU-14733</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01afr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>