<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:59:23 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13216] Kernel NULL pointer dereference in lustre_msg_set_conn_cnt()</title>
                <link>https://jira.whamcloud.com/browse/LU-13216</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;When running auster test suite with SHARED_KEY enabled, sanity-sec test_28 crashes because of a kernel NULL pointer dereference in &lt;tt&gt;lustre_msg_set_conn_cnt()&lt;/tt&gt;. This function gets called from &lt;tt&gt;sptlrpc_req_refresh_ctx()&lt;/tt&gt; via &lt;tt&gt;ctx_refresh_timeout()&lt;/tt&gt;.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[10565.205946] BUG: unable to handle kernel NULL pointer dereference at 0000000000000008
[10565.207453] IP: [&amp;lt;ffffffffc09f0a0c&amp;gt;] lustre_msg_set_conn_cnt+0xc/0xa0 [ptlrpc]
[10565.208767] PGD 80000000797c8067 PUD 7accd067 PMD 0 
[10565.209685] Oops: 0000 [#1] SMP 
[10565.210291] Modules linked in: obdecho(OE) ptlrpc_gss(OE) mgc(OE) lustre(OE) lmv(OE) mdc(OE) fid(OE) osc(OE) lov(OE) fld(OE) ksocklnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) libcfs(OE) rpcsec_gss_krb5 auth_rpcgss nfsv4 dns_resolver nfs lockd grace fscache rpcrdma ib_isert iscsi_target_mod ib_iser libiscsi scsi_transport_iscsi ib_srpt target_core_mod crc_t10dif crct10dif_generic ib_srp scsi_transport_srp scsi_tgt ib_ipoib rdma_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_core sunrpc iosf_mbi crc32_pclmul ghash_clmulni_intel ppdev aesni_intel joydev lrw gf128mul glue_helper ablk_helper cryptd i2c_piix4 pcspkr parport_pc virtio_balloon parport ip_tables ext4 mbcache jbd2 ata_generic pata_acpi virtio_blk 8139too crct10dif_pclmul crct10dif_common crc32c_intel ata_piix serio_raw libata 8139cp virtio_pci virtio_ring
[10565.224100]  virtio mii floppy [last unloaded: libcfs]
[10565.224871] CPU: 0 PID: 21330 Comm: bash Kdump: loaded Tainted: G           OE  ------------   3.10.0-1062.9.1.el7.x86_64 #1
[10565.226677] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[10565.227736] task: ffff8b8afbeb41c0 ti: ffff8b8adf28c000 task.ti: ffff8b8adf28c000
[10565.229220] RIP: 0010:[&amp;lt;ffffffffc09f0a0c&amp;gt;]  [&amp;lt;ffffffffc09f0a0c&amp;gt;] lustre_msg_set_conn_cnt+0xc/0xa0 [ptlrpc]
[10565.230845] RSP: 0018:ffff8b8adf28f630  EFLAGS: 00010246
[10565.231719] RAX: ffff8b8afafd3800 RBX: ffff8b8afb5a8a00 RCX: ffff8b8adf28ffd8
[10565.232866] RDX: 0000000000000100 RSI: 0000000000000001 RDI: 0000000000000000
[10565.234022] RBP: ffff8b8adf28f640 R08: ffff8b8afb5a8a50 R09: ffff8b8aeb749680
[10565.235166] R10: ffffffff8d9a093d R11: ffff8b8af9354f00 R12: ffff8b8aeb749680
[10565.236317] R13: 0000000000000000 R14: ffff8b8aeb749698 R15: ffff8b8aeb749778
[10565.237469] FS:  00007efeee08d740(0000) GS:ffff8b8affc00000(0000) knlGS:0000000000000000
[10565.238759] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[10565.239692] CR2: 0000000000000008 CR3: 000000007afda000 CR4: 00000000000606f0
[10565.240848] Call Trace:
[10565.241304]  [&amp;lt;ffffffffc0a1d558&amp;gt;] sptlrpc_req_refresh_ctx+0x3c8/0xa50 [ptlrpc]
[10565.242632]  [&amp;lt;ffffffffc078a369&amp;gt;] ? lprocfs_counter_add+0xf9/0x160 [obdclass]
[10565.243806]  [&amp;lt;ffffffffc0a1dd60&amp;gt;] sptlrpc_import_check_ctx+0x180/0x3b0 [ptlrpc]
[10565.245007]  [&amp;lt;ffffffffc09b46e6&amp;gt;] ldlm_lock_match_with_skip+0x216/0x7f0 [ptlrpc]
[10565.246228]  [&amp;lt;ffffffff8d98eb44&amp;gt;] ? vsnprintf+0x234/0x6a0
[10565.247150]  [&amp;lt;ffffffffc0b8a5e9&amp;gt;] mdc_lock_match+0xb9/0x180 [mdc]
[10565.248146]  [&amp;lt;ffffffffc0b8db9b&amp;gt;] mdc_revalidate_lock+0x12b/0x1f0 [mdc]
[10565.249228]  [&amp;lt;ffffffffc0b8df02&amp;gt;] mdc_intent_lock+0x2a2/0x560 [mdc]
[10565.250310]  [&amp;lt;ffffffffc0c2c470&amp;gt;] ? ll_md_need_convert+0x1b0/0x1b0 [lustre]
[10565.251481]  [&amp;lt;ffffffffc09c32a0&amp;gt;] ? ldlm_expired_completion_wait+0x220/0x220 [ptlrpc]
[10565.252778]  [&amp;lt;ffffffffc0b91370&amp;gt;] ? mdc_changelog_cdev_finish+0x1f0/0x1f0 [mdc]
[10565.253995]  [&amp;lt;ffffffffc0bcdd4a&amp;gt;] lmv_intent_lock+0x47a/0xaf0 [lmv]
[10565.255018]  [&amp;lt;ffffffff8d733682&amp;gt;] ? from_kgid+0x12/0x20
[10565.255881]  [&amp;lt;ffffffffc0c2c787&amp;gt;] ? ll_i2suppgid+0x37/0x40 [lustre]
[10565.256918]  [&amp;lt;ffffffffc0c2c7c3&amp;gt;] ? ll_i2gids+0x33/0xb0 [lustre]
[10565.257900]  [&amp;lt;ffffffff8d733682&amp;gt;] ? from_kgid+0x12/0x20
[10565.258772]  [&amp;lt;ffffffffc0c2c470&amp;gt;] ? ll_md_need_convert+0x1b0/0x1b0 [lustre]
[10565.259915]  [&amp;lt;ffffffffc0bfbaee&amp;gt;] ll_inode_revalidate+0x12e/0x690 [lustre]
[10565.261045]  [&amp;lt;ffffffffc0bfc253&amp;gt;] ll_inode_permission+0x203/0x3f0 [lustre]
[10565.262162]  [&amp;lt;ffffffff8d8559b7&amp;gt;] ? __follow_mount_rcu+0x37/0x100
[10565.263156]  [&amp;lt;ffffffff8d8565d1&amp;gt;] __inode_permission+0x71/0xd0
[10565.264107]  [&amp;lt;ffffffff8d856648&amp;gt;] inode_permission+0x18/0x50
[10565.265033]  [&amp;lt;ffffffff8d85a6ae&amp;gt;] link_path_walk+0x27e/0x8b0
[10565.265948]  [&amp;lt;ffffffff8d7bd99b&amp;gt;] ? unlock_page+0x2b/0x30
[10565.266825]  [&amp;lt;ffffffff8d85ae4a&amp;gt;] path_lookupat+0x7a/0x8b0
[10565.267715]  [&amp;lt;ffffffff8d824ef5&amp;gt;] ? kmem_cache_alloc+0x35/0x1f0
[10565.268675]  [&amp;lt;ffffffff8d85c45f&amp;gt;] ? getname_flags+0x4f/0x1a0
[10565.269587]  [&amp;lt;ffffffff8d85b6ab&amp;gt;] filename_lookup+0x2b/0xc0
[10565.270484]  [&amp;lt;ffffffff8d85d5f7&amp;gt;] user_path_at_empty+0x67/0xc0
[10565.271434]  [&amp;lt;ffffffff8d7f3ecd&amp;gt;] ? handle_mm_fault+0x39d/0x9b0
[10565.272388]  [&amp;lt;ffffffff8d85d661&amp;gt;] user_path_at+0x11/0x20
[10565.273249]  [&amp;lt;ffffffff8d850343&amp;gt;] vfs_fstatat+0x63/0xc0
[10565.274099]  [&amp;lt;ffffffff8d8506fe&amp;gt;] SYSC_newstat+0x2e/0x60
[10565.274962]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.276028]  [&amp;lt;ffffffff8dd8de15&amp;gt;] ? system_call_after_swapgs+0xa2/0x146
[10565.277096]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.278163]  [&amp;lt;ffffffff8dd8de15&amp;gt;] ? system_call_after_swapgs+0xa2/0x146
[10565.279227]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.280294]  [&amp;lt;ffffffff8dd8de15&amp;gt;] ? system_call_after_swapgs+0xa2/0x146
[10565.281368]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.282515]  [&amp;lt;ffffffff8dd8de15&amp;gt;] ? system_call_after_swapgs+0xa2/0x146
[10565.283593]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.284709]  [&amp;lt;ffffffff8dd8de15&amp;gt;] ? system_call_after_swapgs+0xa2/0x146
[10565.285797]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.286860]  [&amp;lt;ffffffff8d850bbe&amp;gt;] SyS_newstat+0xe/0x10
[10565.287695]  [&amp;lt;ffffffff8dd8dede&amp;gt;] system_call_fastpath+0x25/0x2a
[10565.288665]  [&amp;lt;ffffffff8dd8de21&amp;gt;] ? system_call_after_swapgs+0xae/0x146
[10565.289730] Code: c0 c7 05 0c ec 07 00 00 00 04 00 e8 af ca c7 ff 48 c7 c7 e0 f5 a6 c0 e8 e3 16 c9 ff 0f 1f 00 66 66 66 66 90 55 48 89 e5 41 54 53 &amp;lt;81&amp;gt; 7f 08 d3 0b d0 0b 48 89 fb 75 1d 41 89 f4 ba 98 00 00 00 31 
[10565.294849] RIP  [&amp;lt;ffffffffc09f0a0c&amp;gt;] lustre_msg_set_conn_cnt+0xc/0xa0 [ptlrpc]
[10565.296089]  RSP &amp;lt;ffff8b8adf28f630&amp;gt;
[10565.296684] CR2: 0000000000000008
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="58023">LU-13216</key>
            <summary>Kernel NULL pointer dereference in lustre_msg_set_conn_cnt()</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="sebastien">Sebastien Buisson</assignee>
                                    <reporter username="sebastien">Sebastien Buisson</reporter>
                        <labels>
                    </labels>
                <created>Fri, 7 Feb 2020 16:43:20 +0000</created>
                <updated>Tue, 17 Mar 2020 18:03:54 +0000</updated>
                            <resolved>Tue, 17 Mar 2020 18:03:54 +0000</resolved>
                                                    <fixVersion>Lustre 2.14.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="262839" author="sebastien" created="Fri, 7 Feb 2020 17:11:52 +0000"  >&lt;p&gt;The problem seems to be due to patch c1fad6a9a5 (&quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10467&quot; title=&quot;use standard linux wait_event macros&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10467&quot;&gt;&lt;del&gt;LU-10467&lt;/del&gt;&lt;/a&gt; ptlrpc: convert waiting in sptlrpc_req_refresh_ctx()&quot;).&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/35987&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/35987&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;This patch aims at converting the waiting routine in &lt;tt&gt;sptlrpc_req_refresh_ctx()&lt;/tt&gt;. But it changes slightly its behavior, in case timeout is 0. With the initial implementation, in case of zero timeout, the timeout callback was not called before starting an infinite, interruptible wait. But with the new implementation, this timeout callback gets called before going for an infinite, interruptible wait.&lt;br/&gt;
Unfortunately, when called with zero timeout, &lt;tt&gt;sptlrpc_req_refresh_ctx()&lt;/tt&gt; is not supposed to try to refresh the request, what the timeout callback &lt;tt&gt;ctx_refresh_timeout()&lt;/tt&gt; precisely does. When it tries, it can hit the bug whose stack trace is detailed above.&lt;/p&gt;

&lt;p&gt;I will propose a patch to address this regression.&lt;/p&gt;</comment>
                            <comment id="262840" author="gerrit" created="Fri, 7 Feb 2020 17:29:06 +0000"  >&lt;p&gt;Sebastien Buisson (sbuisson@ddn.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/37473&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37473&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13216&quot; title=&quot;Kernel NULL pointer dereference in lustre_msg_set_conn_cnt()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13216&quot;&gt;&lt;del&gt;LU-13216&lt;/del&gt;&lt;/a&gt; ptlrpc: do not refresh req in case of zero timeout&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 07c8fb64d3e4191a423314ffba0918c205d52793&lt;/p&gt;</comment>
                            <comment id="265414" author="gerrit" created="Tue, 17 Mar 2020 03:41:12 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/37473/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/37473/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13216&quot; title=&quot;Kernel NULL pointer dereference in lustre_msg_set_conn_cnt()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13216&quot;&gt;&lt;del&gt;LU-13216&lt;/del&gt;&lt;/a&gt; ptlrpc: sptlrpc_req_refresh_ctx&apos;s timeout semantic&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 0b09d826149f4baadce305df63396bf86eb20cf7&lt;/p&gt;</comment>
                            <comment id="265476" author="pjones" created="Tue, 17 Mar 2020 18:03:54 +0000"  >&lt;p&gt;Landed for 2.14&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00tdr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>