<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:16:29 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-8316] BUG: unable to handle kernel NULL pointer dereference at  tgt_free_reply_data+0x97/0x330 </title>
                <link>https://jira.whamcloud.com/browse/LU-8316</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;System crashed while testing under memory pressure:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[432534.561808] Lustre: lustre-MDT0000: Will be in recovery for at least 1:00, or until 2 clients reconnect
[432534.563083] Lustre: Skipped 3 previous similar messages
[432534.593088] BUG: unable to handle kernel NULL pointer dereference at           (null)
[432534.594035] IP: [&amp;lt;ffffffffa07d31f7&amp;gt;] tgt_free_reply_data+0x97/0x330 [ptlrpc]
[432534.594035] PGD 3c7cb067 PUD 3836e067 PMD 0 
[432534.594035] Oops: 0002 [#1] SMP 
[432534.594035] Modules linked in: lustre(OF) ofd(OF) osp(OF) lod(OF) ost(OF) mdt(OF) mdd(OF) mgs(OF) osd_ldiskfs(OF) ldiskfs(OF) lquota(OF) lfsck(OF) obdecho(OF) mgc(OF) lov(OF) osc(OF) mdc(OF) lmv(OF) fid(OF) fld(OF) ptlrpc(OF) obdclass(OF) ksocklnd(OF) lnet(OF) libcfs(OF) loop mbcache jbd2 sha512_generic netconsole sg dm_mirror dm_region_hash dm_log crct10dif_pclmul crct10dif_common crc32_pclmul crc32c_intel ghash_clmulni_intel aesni_intel lrw gf128mul glue_helper ablk_helper cryptd serio_raw virtio_balloon virtio_console dm_mod intel_agp i2c_piix4 intel_gtt nfsd auth_rpcgss nfs_acl lockd sunrpc ip_tables xfs ata_generic libcrc32c virtio_net cirrus syscopyarea sysfillrect sysimgblt virtio_scsi drm_kms_helper virtio_blk ttm drm virtio_pci agpgart ata_piix virtio_ring libata virtio i2c_core [last unloaded: libcfs]
[432534.594035] CPU: 1 PID: 5669 Comm: mdt01_003 Tainted: GF          O--------------   3.10.0-229.7.2.x86_64 #7
[432534.594035] Hardware name: QEMU Standard PC (i440FX + PIIX, 1996), BIOS 1.7.5-20140709_153950- 04/01/2014
[432534.594035] task: ffff880025081580 ti: ffff88002da2c000 task.ti: ffff88002da2c000
[432534.594035] RIP: 0010:[&amp;lt;ffffffffa07d31f7&amp;gt;]  [&amp;lt;ffffffffa07d31f7&amp;gt;] tgt_free_reply_data+0x97/0x330 [ptlrpc]
[432534.594035] RSP: 0018:ffff88002da2fb90  EFLAGS: 00010293
[432534.594035] RAX: 0000000000000001 RBX: ffff8800133fb8d8 RCX: 0000000000000000
[432534.594035] RDX: 0000000000000000 RSI: ffff88001289f300 RDI: ffff8800133fb8d8
[432534.594035] RBP: ffff88002da2fbd8 R08: ffff8800133fb8d8 R09: 0000000000000000
[432534.594035] R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000000001
[432534.594035] R13: ffff880000e65718 R14: ffff88001289f3f8 R15: ffff88001289f300
[432534.594035] FS:  0000000000000000(0000) GS:ffff88003fd00000(0000) knlGS:0000000000000000
[432534.594035] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[432534.594035] CR2: 0000000000bfc001 CR3: 000000003c289000 CR4: 00000000001406e0
[432534.594035] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[432534.594035] DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
[432534.594035] Stack:
[432534.594035]  0000000000000000 ffff88001289f3f8 ffffffff810c486d ffff88002da2fc30
[432534.594035]  ffff8800133fb8d8 ffff88001289f300 ffff88001289ef60 ffff88001289f3f8
[432534.594035]  ffff880000e65718 ffff88002da2fc30 ffffffffa07d34ee 0000000000000246
[432534.594035] Call Trace:
[432534.594035]  [&amp;lt;ffffffff810c486d&amp;gt;] ? trace_hardirqs_on+0xd/0x10
[432534.594035]  [&amp;lt;ffffffffa07d34ee&amp;gt;] tgt_release_reply_data+0x5e/0x180 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffffa07dc128&amp;gt;] tgt_handle_received_xid+0x98/0xe0 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffffa07e1d38&amp;gt;] tgt_request_handle+0xb88/0x1330 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffffa078d591&amp;gt;] ptlrpc_server_handle_request+0x231/0xac0 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffffa078be15&amp;gt;] ? ptlrpc_wait_event+0xa5/0x360 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffffa0791790&amp;gt;] ptlrpc_main+0xab0/0x1e10 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffff810c486d&amp;gt;] ? trace_hardirqs_on+0xd/0x10
[432534.594035]  [&amp;lt;ffffffff8109b842&amp;gt;] ? finish_task_switch+0x42/0x150
[432534.594035]  [&amp;lt;ffffffffa0790ce0&amp;gt;] ? ptlrpc_register_service+0xe50/0xe50 [ptlrpc]
[432534.594035]  [&amp;lt;ffffffff8109008a&amp;gt;] kthread+0xea/0xf0
[432534.594035]  [&amp;lt;ffffffff8108ffa0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[432534.594035]  [&amp;lt;ffffffff81571258&amp;gt;] ret_from_fork+0x58/0x90
[432534.594035]  [&amp;lt;ffffffff8108ffa0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[432534.594035] Code: c1 fa 1f c1 ea 0c c1 f9 14 41 8d 04 14 25 ff ff 0f 00 29 d0 83 f9 0f 0f 8f 72 02 00 00 49 8b 95 28 04 00 00 48 63 c9 48 8b 14 ca &amp;lt;f0&amp;gt; 0f b3 02 19 c0 85 c0 0f 84 8b 01 00 00 48 85 db 0f 84 1b 02 
[432534.594035] RIP  [&amp;lt;ffffffffa07d31f7&amp;gt;] tgt_free_reply_data+0x97/0x330 [ptlrpc]
[432534.594035]  RSP &amp;lt;ffff88002da2fb90&amp;gt;
[432534.594035] CR2: 0000000000000000
[432534.712915] ---[ end trace 26ac593d02d07dd0 ]---
[432534.714120] Kernel panic - not syncing: Fatal exception

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This issue is caused by the wrong return value on the allocation-failure path in the following code:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;        /* reply_data is supported by MDT targets only for now */
        if (strncmp(obd-&amp;gt;obd_type-&amp;gt;typ_name, LUSTRE_MDT_NAME, 3) != 0)
                RETURN(0);

        OBD_ALLOC(lut-&amp;gt;lut_reply_bitmap,
                  LUT_REPLY_SLOTS_MAX_CHUNKS * sizeof(unsigned long *));
        if (lut-&amp;gt;lut_reply_bitmap == NULL)
                GOTO(out, rc);
-----------------------------^^^

        memset(&amp;amp;attr, 0, sizeof(attr));
        attr.la_valid = LA_MODE;

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I&apos;ll push a patch for it.&lt;/p&gt;</description>
                <environment></environment>
        <key id="37737">LU-8316</key>
            <summary>BUG: unable to handle kernel NULL pointer dereference at  tgt_free_reply_data+0x97/0x330 </summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="ys">Yang Sheng</reporter>
                        <labels>
                    </labels>
                <created>Wed, 22 Jun 2016 12:47:39 +0000</created>
                <updated>Mon, 11 May 2020 17:47:28 +0000</updated>
                            <resolved>Mon, 11 May 2020 17:47:28 +0000</resolved>
                                    <version>Lustre 2.11.0</version>
                                    <fixVersion>Lustre 2.9.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="156482" author="gerrit" created="Wed, 22 Jun 2016 13:21:25 +0000"  >&lt;p&gt;Yang Sheng (yang.sheng@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/20918&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/20918&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8316&quot; title=&quot;BUG: unable to handle kernel NULL pointer dereference at  tgt_free_reply_data+0x97/0x330 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8316&quot;&gt;&lt;del&gt;LU-8316&lt;/del&gt;&lt;/a&gt; tgt: return -ENOMEM while kmalloc failed&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: bfff1305da9b03766b253631a729a0007fbd6782&lt;/p&gt;</comment>
                            <comment id="156668" author="green" created="Thu, 23 Jun 2016 14:30:16 +0000"  >&lt;p&gt;Must be a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8199&quot; title=&quot;NULL pointer dereference in tgt_free_reply_data&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8199&quot;&gt;&lt;del&gt;LU-8199&lt;/del&gt;&lt;/a&gt;, which also has a patch?&lt;/p&gt;</comment>
                            <comment id="157228" author="ys" created="Wed, 29 Jun 2016 04:07:16 +0000"  >&lt;p&gt;Hi, Oleg,&lt;/p&gt;

&lt;p&gt;Yes, I think it is almost a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8199&quot; title=&quot;NULL pointer dereference in tgt_free_reply_data&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8199&quot;&gt;&lt;del&gt;LU-8199&lt;/del&gt;&lt;/a&gt;. But the 8199 patch is an improvement patch, while this one is a bug-fix patch. They do not conflict.&lt;/p&gt;</comment>
                            <comment id="157735" author="gerrit" created="Tue, 5 Jul 2016 23:52:05 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;http://review.whamcloud.com/20918/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/20918/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8316&quot; title=&quot;BUG: unable to handle kernel NULL pointer dereference at  tgt_free_reply_data+0x97/0x330 &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8316&quot;&gt;&lt;del&gt;LU-8316&lt;/del&gt;&lt;/a&gt; tgt: return -ENOMEM while kmalloc failed&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 36451f3be0bbc7858d848b5b6ee6e9133de9115d&lt;/p&gt;</comment>
                            <comment id="157749" author="ys" created="Wed, 6 Jul 2016 02:34:43 +0000"  >&lt;p&gt;Patch landed. Close ticket.&lt;/p&gt;</comment>
                            <comment id="226639" author="green" created="Tue, 24 Apr 2018 17:01:08 +0000"  >&lt;p&gt;I just had this hit again on current master-next.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[178184.101361] Lustre: DEBUG MARKER: == replay-single test 39: test recovery from unlink llog (test llog_gen_rec) ========================= 02:06:10 (1524377170)
[178187.227063] Turning device loop0 (0x700000) read-only
[178187.304890] Lustre: DEBUG MARKER: mds1 REPLAY BARRIER on lustre-MDT0000
[178187.327340] Lustre: DEBUG MARKER: local REPLAY BARRIER on lustre-MDT0000
[178189.095109] LustreError: 25219:0:(client.c:1147:ptlrpc_import_delay_req()) @@@ IMP_CLOSED   req@ffff8802930a6c00 x1598423905600144/t0(0) o6-&amp;gt;lustre-OST0000-osc-MDT0000@0@lo:28/4 lens 664/432 e 0 to 0 dl 0 ref 1 fl Rpc:/0/ffffffff rc 0/-1
[178189.160680] BUG: unable to handle kernel NULL pointer dereference at           (null)
[178189.162062] IP: [&amp;lt;ffffffffa06557d3&amp;gt;] tgt_free_reply_data+0x93/0x370 [ptlrpc]
[178189.163275] PGD 0 
[178189.163867] Oops: 0000 [#1] SMP DEBUG_PAGEALLOC
[178189.164595] Modules linked in: lustre(OE) ofd(OE) osp(OE) lod(OE) ost(OE) mdt(OE) mdd(OE) mgs(OE) osd_ldiskfs(OE) ldiskfs(OE) lquota(OE) lfsck(OE) obdecho(OE) mgc(OE) lov(OE) mdc(OE) osc(OE) lmv(OE) fid(OE) fld(OE) ptlrpc_gss(OE) ptlrpc(OE) obdclass(OE) ksocklnd(OE) lnet(OE) libcfs(OE) loop zfs(PO) zunicode(PO) zavl(PO) icp(PO) zcommon(PO) znvpair(PO) spl(O) zlib_deflate mbcache jbd2 syscopyarea sysfillrect sysimgblt ata_generic ttm pata_acpi drm_kms_helper drm ata_piix i2c_piix4 libata pcspkr serio_raw virtio_balloon virtio_blk virtio_console i2c_core floppy nfsd ip_tables rpcsec_gss_krb5 [last unloaded: libcfs]
[178189.172341] CPU: 3 PID: 143 Comm: kworker/3:1 Tainted: P           OE  ------------   3.10.0-debug #2
[178189.176342] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[178189.177281] Workqueue: obd_zombid obd_zombie_exp_cull [obdclass]
[178189.177975] task: ffff88032107e4c0 ti: ffff880321084000 task.ti: ffff880321084000
[178189.182094] RIP: 0010:[&amp;lt;ffffffffa06557d3&amp;gt;]  [&amp;lt;ffffffffa06557d3&amp;gt;] tgt_free_reply_data+0x93/0x370 [ptlrpc]
[178189.183637] RSP: 0018:ffff880321087c68  EFLAGS: 00010293
[178189.184412] RAX: 0000000000000000 RBX: ffff88025d2b5500 RCX: 0000000000000000
[178189.185641] RDX: 0000000000000000 RSI: ffff8800a9644be0 RDI: ffff88025d2b5500
[178189.187161] RBP: ffff880321087cb0 R08: ffff88025d2b5500 R09: 0000000000000000
[178189.188393] R10: 0000000000000000 R11: ffff88028dce37e0 R12: 0000000000000000
[178189.189623] R13: ffff88029383c0b0 R14: ffff88029383c0b0 R15: ffff8800a9644be0
[178189.190921] FS:  0000000000000000(0000) GS:ffff88033e460000(0000) knlGS:0000000000000000
[178189.192189] CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
[178189.192849] CR2: 0000000000000000 CR3: 0000000001c0e000 CR4: 00000000000006e0
[178189.194304] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[178189.195545] DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
[178189.196776] Stack:
[178189.197399]  ffff88032107e4c0 ffff8800a9644be0 0000000000000000 ffff880321087fd8
[178189.199036]  ffff88027eaa9400 ffff8800a9644be0 ffff8800a9644be0 ffff88029383c0b0
[178189.201390]  ffff88029383c0b0 ffff880321087d08 ffffffffa0655b38 ffff880321087d10
[178189.207062] Call Trace:
[178189.207804]  [&amp;lt;ffffffffa0655b38&amp;gt;] tgt_release_reply_data+0x88/0x180 [ptlrpc]
[178189.208621]  [&amp;lt;ffffffffa02183d8&amp;gt;] ? cfs_hash_putref+0x2e8/0x500 [libcfs]
[178189.209388]  [&amp;lt;ffffffffa06562e1&amp;gt;] tgt_client_free+0x81/0x360 [ptlrpc]
[178189.210344]  [&amp;lt;ffffffffa0cda13a&amp;gt;] mdt_destroy_export+0x5a/0x200 [mdt]
[178189.211100]  [&amp;lt;ffffffffa0395815&amp;gt;] class_export_destroy+0xe5/0x490 [obdclass]
[178189.211914]  [&amp;lt;ffffffffa0395bd5&amp;gt;] obd_zombie_exp_cull+0x15/0x20 [obdclass]
[178189.212897]  [&amp;lt;ffffffff8109adb6&amp;gt;] process_one_work+0x206/0x5b0
[178189.213660]  [&amp;lt;ffffffff8109ad4b&amp;gt;] ? process_one_work+0x19b/0x5b0
[178189.214358]  [&amp;lt;ffffffff8109b27b&amp;gt;] worker_thread+0x11b/0x3a0
[178189.215037]  [&amp;lt;ffffffff8109b160&amp;gt;] ? process_one_work+0x5b0/0x5b0
[178189.215718]  [&amp;lt;ffffffff810a2eba&amp;gt;] kthread+0xea/0xf0
[178189.216382]  [&amp;lt;ffffffff810a2dd0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[178189.217103]  [&amp;lt;ffffffff8170fb98&amp;gt;] ret_from_fork+0x58/0x90
[178189.217805]  [&amp;lt;ffffffff810a2dd0&amp;gt;] ? kthread_create_on_node+0x140/0x140
[178189.251576] Code: 41 0f 49 cc c1 fa 1f c1 ea 0c c1 f9 14 41 8d 04 14 25 ff ff 0f 00 29 d0 83 f9 0f 0f 8f b1 02 00 00 49 8b 95 58 04 00 00 48 63 c9 &amp;lt;48&amp;gt; 8b 14 ca 48 85 d2 0f 84 cf 01 00 00 f0 0f b3 02 19 c0 85 c0 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="226640" author="green" created="Tue, 24 Apr 2018 17:01:26 +0000"  >&lt;p&gt;seems to be still present&lt;/p&gt;</comment>
                            <comment id="269845" author="green" created="Mon, 11 May 2020 17:47:28 +0000"  >&lt;p&gt;It seems this has not reoccurred in my testing since Apr 23, 2018.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="37182">LU-8199</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzyfcf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>