<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:55:45 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-12799] NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import</title>
                <link>https://jira.whamcloud.com/browse/LU-12799</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Disconnecting from an idle import results in a NULL pointer dereference if the ptlrpc request cannot be allocated due to insufficient free memory.&lt;/p&gt;

&lt;p&gt;From console log:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;&amp;gt; 2019-07-28T07:17:40.193910-05:00 c3-0c1s14n3 page allocation failure: order:0
&amp;gt; 2019-07-28T07:17:40.193923-05:00 c3-0c1s14n3 / mems_allowed=0-1
&amp;gt; 2019-07-28T07:17:40.193938-05:00 c3-0c1s14n3 LustreError: 21724:0:(client.c:893:__ptlrpc_request_alloc()) request allocation out of memory
&amp;gt; 2019-07-28T07:17:40.193953-05:00 c3-0c1s14n3 , mode:0x17080c0(GFP_KERNEL_ACCOUNT|__GFP_ZERO|__GFP_NOTRACK), nodemask=
&amp;gt; 2019-07-28T07:17:40.193967-05:00 c3-0c1s14n3 BUG: unable to handle kernel
&amp;gt; 2019-07-28T07:17:40.193992-05:00 c3-0c1s14n3 (null)
&amp;gt; 2019-07-28T07:17:40.194007-05:00 c3-0c1s14n3 NULL pointer dereference at 0000000000000160
&amp;gt; 2019-07-28T07:17:40.194073-05:00 c3-0c1s14n3 IP: ptlrpc_disconnect_and_idle_import+0x19d/0x290 [ptlrpc]
&amp;gt; 2019-07-28T07:17:40.194088-05:00 c3-0c1s14n3 PGD 0
&amp;gt; 2019-07-28T07:17:40.194103-05:00 c3-0c1s14n3 memfill2 cpuset=
&amp;gt; 2019-07-28T07:17:40.194116-05:00 c3-0c1s14n3 P4D 0
&amp;gt; 2019-07-28T07:17:40.194131-05:00 c3-0c1s14n3 Oops: 0002 [#1] SMP PTI
&amp;gt; 2019-07-28T07:17:40.194146-05:00 c3-0c1s14n3 CPU: 25 PID: 21724 Comm: kworker/25:1 Tainted: P           O     4.12.14-150.17_5.0.84-cray_ari_c #1 SLE15 (unreleased)
&amp;gt; 2019-07-28T07:17:40.194161-05:00 c3-0c1s14n3 Hardware name: Cray Inc. Cascade/Cascade, BIOS 5.11 03/22/2018
&amp;gt; 2019-07-28T07:17:40.194175-05:00 c3-0c1s14n3 2352114
&amp;gt; 2019-07-28T07:17:40.194190-05:00 c3-0c1s14n3 Workqueue: ptlrpc_pinger ptlrpc_pinger_main [ptlrpc]
&amp;gt; 2019-07-28T07:17:40.194204-05:00 c3-0c1s14n3 mems_allowed=0-1
&amp;gt; 2019-07-28T07:17:40.194218-05:00 c3-0c1s14n3 task: ffff8815c1696000 task.stack: ffffc9000753c000
&amp;gt; 2019-07-28T07:17:40.194232-05:00 c3-0c1s14n3 RIP: 0010:ptlrpc_disconnect_and_idle_import+0x19d/0x290 [ptlrpc]
&amp;gt; 2019-07-28T07:17:40.194246-05:00 c3-0c1s14n3 RSP: 0000:ffffc9000753fe18 EFLAGS: 00010296
&amp;gt; 2019-07-28T07:17:40.194261-05:00 c3-0c1s14n3 RAX: 0000000000000001 RBX: ffff881f8c920000 RCX: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194276-05:00 c3-0c1s14n3 RDX: 0000000000000336 RSI: 0000000000000000 RDI: ffff881f90478c80
&amp;gt; 2019-07-28T07:17:40.194290-05:00 c3-0c1s14n3 RBP: ffffc9000753fe28 R08: 0000000000000000 R09: ffff88118101a358
&amp;gt; 2019-07-28T07:17:40.194304-05:00 c3-0c1s14n3 R10: ffffc9000753f960 R11: ffff88118101a392 R12: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194319-05:00 c3-0c1s14n3 R13: 0000000000000000 R14: ffff881f8c920278 R15: ffff881f8c920020
&amp;gt; 2019-07-28T07:17:40.194333-05:00 c3-0c1s14n3 FS:  0000000000000000(0000) GS:ffff88203f5c0000(0000) knlGS:0000000000000000
&amp;gt; 2019-07-28T07:17:40.194347-05:00 c3-0c1s14n3 CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
&amp;gt; 2019-07-28T07:17:40.194362-05:00 c3-0c1s14n3 CR2: 0000000000000160 CR3: 0000000001e0a002 CR4: 00000000003606e0
&amp;gt; 2019-07-28T07:17:40.194376-05:00 c3-0c1s14n3 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194390-05:00 c3-0c1s14n3 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
&amp;gt; 2019-07-28T07:17:40.194404-05:00 c3-0c1s14n3 Call Trace:
&amp;gt; 2019-07-28T07:17:40.194419-05:00 c3-0c1s14n3 ptlrpc_pinger_main+0x53b/0x900 [ptlrpc]
&amp;gt; 2019-07-28T07:17:40.194432-05:00 c3-0c1s14n3 process_one_work+0x260/0x4a0
&amp;gt; 2019-07-28T07:17:40.194446-05:00 c3-0c1s14n3 worker_thread+0x45/0x420
&amp;gt; 2019-07-28T07:17:40.194460-05:00 c3-0c1s14n3 kthread+0x127/0x140
&amp;gt; 2019-07-28T07:17:40.194475-05:00 c3-0c1s14n3 ? trace_event_raw_event_workqueue_execute_start+0x90/0x90
&amp;gt; 2019-07-28T07:17:40.194490-05:00 c3-0c1s14n3 ? kthread_create_on_node+0x40/0x40
&amp;gt; 2019-07-28T07:17:40.194504-05:00 c3-0c1s14n3 ret_from_fork+0x3a/0x50

&amp;gt; 2019-07-28T07:17:40.194591-05:00 c3-0c1s14n3 CR2: 0000000000000160
&amp;gt; 2019-07-28T07:17:40.194606-05:00 c3-0c1s14n3 ---[ end trace 26bbd436eb3f80b0 ]---
&amp;gt; 2019-07-28T07:17:40.194620-05:00 c3-0c1s14n3 RIP: 0010:ptlrpc_disconnect_and_idle_import+0x19d/0x290 [ptlrpc]
&amp;gt; 2019-07-28T07:17:40.194645-05:00 c3-0c1s14n3 RSP: 0000:ffffc9000753fe18 EFLAGS: 00010296
&amp;gt; 2019-07-28T07:17:40.194672-05:00 c3-0c1s14n3 RAX: 0000000000000001 RBX: ffff881f8c920000 RCX: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194686-05:00 c3-0c1s14n3 RDX: 0000000000000336 RSI: 0000000000000000 RDI: ffff881f90478c80
&amp;gt; 2019-07-28T07:17:40.194701-05:00 c3-0c1s14n3 RBP: ffffc9000753fe28 R08: 0000000000000000 R09: ffff88118101a358
&amp;gt; 2019-07-28T07:17:40.194715-05:00 c3-0c1s14n3 R10: ffffc9000753f960 R11: ffff88118101a392 R12: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194729-05:00 c3-0c1s14n3 R13: 0000000000000000 R14: ffff881f8c920278 R15: ffff881f8c920020
&amp;gt; 2019-07-28T07:17:40.194744-05:00 c3-0c1s14n3 FS:  0000000000000000(0000) GS:ffff88203f5c0000(0000) knlGS:0000000000000000
&amp;gt; 2019-07-28T07:17:40.194758-05:00 c3-0c1s14n3 CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
&amp;gt; 2019-07-28T07:17:40.194772-05:00 c3-0c1s14n3 CR2: 0000000000000160 CR3: 0000000001e0a002 CR4: 00000000003606e0
&amp;gt; 2019-07-28T07:17:40.194788-05:00 c3-0c1s14n3 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
&amp;gt; 2019-07-28T07:17:40.194802-05:00 c3-0c1s14n3 DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
&amp;gt; 2019-07-28T07:17:40.194818-05:00 c3-0c1s14n3 Kernel panic - not syncing: Fatal exception
&amp;gt; 2019-07-28T07:17:40.194832-05:00 c3-0c1s14n3 Shutting down cpus with NMI
&amp;gt; 2019-07-28T07:17:40.194846-05:00 c3-0c1s14n3 Kernel Offset: disabled
&amp;gt; 2019-07-28T07:17:40.194860-05:00 c3-0c1s14n3 ---[ end Kernel panic - not syncing: Fatal exception
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;From dklog:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;crash_x86_64&amp;gt; epython dk | grep &apos;:21724:&apos;
00000100:00080000:25.0:1564316239.230647:000000:21724:0:(import.c:1781:ptlrpc_disconnect_and_idle_import()) snx11242-OST0001-osc-ffff880f866d1000: disconnect after 81s idle
00000100:00080000:25.0:1564316239.230650:000000:21724:0:(import.c:1624:ptlrpc_disconnect_prep_req()) ffff881f8aeee000 snx11242-OST0002_UUID: changing import state from FULL to CONNECTING
00000100:00080000:25.0:1564316239.230651:000000:21724:0:(import.c:1781:ptlrpc_disconnect_and_idle_import()) snx11242-OST0002-osc-ffff880f866d1000: disconnect after 80s idle
00000100:00020000:25.0:1564316255.177461:000000:21724:0:(client.c:893:__ptlrpc_request_alloc()) request allocation out of memory
00000100:00080000:25.0:1564316255.180754:000000:21724:0:(import.c:1781:ptlrpc_disconnect_and_idle_import()) snx11242-OST0003-osc-ffff880f866d1000: disconnect after 97s idle

crash_x86_64&amp;gt; epython obd_devs
obd_device          obd_name               	ip_address             client_obd          obd_import          imp_state    ish_time   index   conn_cnt
========================================================================================================================================================
0xffff881fa37703c0  snx11242-OST0003      	10.155.10.8@o2ib3003  	 0xffff881fa3770868  0xffff881f8c920000  FULL       1564316158     5   141
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;obd_import 0xffff881f8c920000 is idle so ptlrpc_disconnect_and_idle_import() is called.&lt;br/&gt;
The node is out of memory, so ptlrpc_disconnect_prep_req(imp) returns NULL, but the error handling only checks for an error pointer (IS_ERR) and does not handle the NULL case.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;1757 int ptlrpc_disconnect_and_idle_import(struct obd_import *imp)
1758 {
...
1775         req = ptlrpc_disconnect_prep_req(imp);
1776         if (IS_ERR(req))
1777                 RETURN(PTR_ERR(req));
1778
1779         CDEBUG_LIMIT(imp-&amp;gt;imp_idle_debug, &quot;%s: disconnect after %llus idle\n&quot;,
1780                      imp-&amp;gt;imp_obd-&amp;gt;obd_name,
1781                      ktime_get_real_seconds() - imp-&amp;gt;imp_last_reply_time);
1782         req-&amp;gt;rq_interpret_reply = ptlrpc_disconnect_idle_interpret;    &amp;lt;---- NULL pointer dereference
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="56983">LU-12799</key>
            <summary>NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="amk">Ann Koehler</assignee>
                                    <reporter username="amk">Ann Koehler</reporter>
                        <labels>
                    </labels>
                <created>Tue, 24 Sep 2019 20:22:51 +0000</created>
                <updated>Mon, 10 Feb 2020 16:47:17 +0000</updated>
                            <resolved>Wed, 23 Oct 2019 03:36:54 +0000</resolved>
                                    <version>Lustre 2.12.2</version>
                                    <fixVersion>Lustre 2.13.0</fixVersion>
                    <fixVersion>Lustre 2.14.0</fixVersion>
                    <fixVersion>Lustre 2.12.4</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="255321" author="gerrit" created="Tue, 24 Sep 2019 20:30:30 +0000"  >&lt;p&gt;Alex Zhuravlev (bzzz@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/36282&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/36282&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12799&quot; title=&quot;NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12799&quot;&gt;&lt;del&gt;LU-12799&lt;/del&gt;&lt;/a&gt; ptlrpc: return proper error code&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 108a7f819ad5241c095779a6f70ba524606b3328&lt;/p&gt;</comment>
                            <comment id="256887" author="gerrit" created="Tue, 22 Oct 2019 23:57:32 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/36282/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/36282/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12799&quot; title=&quot;NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12799&quot;&gt;&lt;del&gt;LU-12799&lt;/del&gt;&lt;/a&gt; ptlrpc: return proper error code&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 9e2620d75cce1e1b4855704ddd9a994ce8e8d650&lt;/p&gt;</comment>
                            <comment id="256906" author="pjones" created="Wed, 23 Oct 2019 03:36:54 +0000"  >&lt;p&gt;Landed for 2.13&lt;/p&gt;</comment>
                            <comment id="260784" author="gerrit" created="Wed, 8 Jan 2020 19:24:24 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37164&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37164&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12799&quot; title=&quot;NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12799&quot;&gt;&lt;del&gt;LU-12799&lt;/del&gt;&lt;/a&gt; ptlrpc: return proper error code&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: ef4895857f85ad4f15c50b3db39732644c97b309&lt;/p&gt;</comment>
                            <comment id="261935" author="gerrit" created="Mon, 27 Jan 2020 23:12:34 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37164/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37164/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12799&quot; title=&quot;NULL pointer dereference IP: ptlrpc_disconnect_and_idle_import&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12799&quot;&gt;&lt;del&gt;LU-12799&lt;/del&gt;&lt;/a&gt; ptlrpc: return proper error code&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 939d8bb0cf88babe1b9812bc03e07d7811bf2770&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00n7j:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>