<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:27:25 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16484] Linux kernel BUG when deleting and adding a peer and using a filesystem</title>
                <link>https://jira.whamcloud.com/browse/LU-16484</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Using a small 2-node cluster with 1 server and 1 client.&#160; On the client, I ran the following in loops in two windows:&lt;/p&gt;

&lt;p&gt;Window #1:&lt;/p&gt;

&lt;p&gt;&#160; &#160; &#160; &#160; lnetctl peer del --prim_nid $PEER&lt;br/&gt;
&#160; &#160; &#160; &#160; lnetctl peer add --prim_nid $PEER&lt;/p&gt;

&lt;p&gt;Where $PEER is the NID of the server.&lt;/p&gt;

&lt;p&gt;Window #2:&lt;/p&gt;

&lt;p&gt;&#160; &#160; &#160; &#160; touch $BASE_DIR/qq&lt;br/&gt;
&#160; &#160; &#160; &#160; rm -f $BASE_DIR/*&lt;/p&gt;

&lt;p&gt;Where $BASE_DIR is a directory within a mounted Lustre file system from $PEER.&lt;/p&gt;

&lt;p&gt;Running either loop on its own results in no issues.&#160; Running both at the same time results in a kernel BUG.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 8763.523887] list_add corruption. prev-&amp;gt;next should be next (ffff8e98555a72e0), but was ffff8e98056d2810. (prev=ffff8e98056d2810).
[ 8763.536952] ------------[ cut here ]------------
[ 8763.536953] kernel BUG at lib/list_debug.c:28!
[ 8763.541933] invalid opcode: 0000 [#1] SMP PTI
[ 8763.546809] CPU: 9 PID: 18262 Comm: lnet_discovery Kdump: loaded Tainted: G &#160; &#160; &#160; &#160; &#160; OE &#160; &#160;--------- - &#160;- 4.18.0-348.el8.0.2.x86_64 #1
[ 8763.560434] Hardware name: Intel Corporation S2600WT2/S2600WT2, BIOS SE5C610.86B.01.01.1029.090220201031 09/02/2020
[ 8763.572117] RIP: 0010:__list_add_valid.cold.0+0x26/0x28
[ 8763.577964] Code: 00 00 00 c3 48 89 d1 48 c7 c7 88 6e 51 91 48 89 c2 e8 a0 da ca ff 0f 0b 48 89 c1 4c 89 c6 48 c7 c7 e0 6e 51 91 e8 8c da ca ff &amp;lt;0f&amp;gt; 0b 48 89 fe 48 89 c2 48 c7 c7 70 6f 51 91 e8 78 da ca ff 0f 0b
[ 8763.598976] RSP: 0018:ffffb7c9658e7d80 EFLAGS: 00010246
[ 8763.604823] RAX: 0000000000000075 RBX: ffff8e98555a72c0 RCX: 0000000000000000
[ 8763.612808] RDX: 0000000000000000 RSI: ffff8ea73fa56818 RDI: ffff8ea73fa56818
[ 8763.620794] RBP: ffff8e98056d2800 R08: 0000000000006475 R09: 0000000000aaaaaa
[ 8763.628779] R10: 0000000000000000 R11: 0000000000000001 R12: ffff8e98555a730c
[ 8763.636765] R13: ffff8e98056d2810 R14: ffff8e9931905c00 R15: 0000000000000000
[ 8763.644751] FS: &#160;0000000000000000(0000) GS:ffff8ea73fa40000(0000) knlGS:0000000000000000
[ 8763.653806] CS: &#160;0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[ 8763.660235] CR2: 000056304a85f748 CR3: 0000000f35610005 CR4: 00000000001706e0
[ 8763.668221] Call Trace:
[ 8763.670972] &#160;lnet_select_pathway+0xebd/0x12d0 [lnet]
[ 8763.676538] &#160;lnet_send+0x5d/0x1b0 [lnet]
[ 8763.680936] &#160;lnet_peer_discovery+0x277/0x11f0 [lnet]
[ 8763.686491] &#160;? __schedule+0x2cc/0x700
[ 8763.690591] &#160;? finish_wait+0x80/0x80
[ 8763.694600] &#160;? lnet_peer_merge_data+0xd50/0xd50 [lnet]
[ 8763.700350] &#160;kthread+0x116/0x130
[ 8763.703962] &#160;? kthread_flush_work_fn+0x10/0x10
[ 8763.708933] &#160;ret_from_fork+0x35/0x40&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</description>
                <environment>2-node cluster:&lt;br/&gt;
Lustre Client / Rocky 8.5 with Lustre 2.12.9&lt;br/&gt;
Lustre Server / CentOS 7.9 with Lustre 2.12.6&lt;br/&gt;
Transport: OPA</environment>
        <key id="74046">LU-16484</key>
            <summary>Linux kernel BUG when deleting and adding a peer and using a filesystem</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="luick">Dean Luick</reporter>
                        <labels>
                    </labels>
                <created>Tue, 17 Jan 2023 21:03:17 +0000</created>
                <updated>Fri, 20 Jan 2023 17:41:46 +0000</updated>
                                            <version>Lustre 2.12.9</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>1</watches>
                                                                            <comments>
                            <comment id="359381" author="JIRAUSER18439" created="Tue, 17 Jan 2023 21:04:58 +0000"  >&lt;p&gt;The steps in the description were an attempt to recreate a failure described in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16349&quot; title=&quot;Excessive number of OPA disconnects / LNET network errors in cluster&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16349&quot;&gt;&lt;del&gt;LU-16349&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="73420">LU-16349</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i03a9j:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>