<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:23:13 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16013] SLES15 SP4 client BUG: kernel NULL pointer dereference</title>
                <link>https://jira.whamcloud.com/browse/LU-16013</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;While testing SLES15 SP4 client support patch &lt;a href=&quot;https://review.whamcloud.com/47924&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/47924&lt;/a&gt; with kernel 5.14.21-150400.22.1 on Lustre b2_15 branch, sanity test 0d hung.&lt;/p&gt;

&lt;p&gt;Console log on client:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;BUG: kernel NULL pointer dereference, address: 0000000000000000
#PF: supervisor instruction fetch in kernel mode
#PF: error_code(0x0010) - not-present page
PGD 0 P4D 0
Oops: 0010 [#1] PREEMPT SMP PTI
CPU: 0 PID: 21801 Comm: tee Kdump: loaded Tainted: G           OE     N 5.14.21-150400.22-default #1 SLE15-SP4 0b6a6578ade2de5c4a0b916095dff44f76ef1704
Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
RIP: 0010:0x0
Code: Unable to access opcode bytes at RIP 0xffffffffffffffd6.
RSP: 0018:ffffa052c33b3938 EFLAGS: 00010002
RAX: 0000000000000000 RBX: 0000000000000001 RCX: 0000000000000000
RDX: 0000000000000001 RSI: ffff8dd956c55298 RDI: ffffe011c04cc500
RBP: ffff8dd954416f90 R08: 000000000000041d R09: 0000000000000bf3
R10: ffffa052c33b3940 R11: 0000000000000000 R12: ffff8dd956c55298
R13: 0000000000000000 R14: ffffe011c04cc500 R15: 0000000000000000
FS:  00007f1eaeb68740(0000) GS:ffff8dd9ffc00000(0000) knlGS:0000000000000000 
CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
CR2: ffffffffffffffd6 CR3: 0000000021102001 CR4: 00000000001706f0
Call Trace:
 &amp;lt;TASK&amp;gt;
 vvp_set_pagevec_dirty+0x171/0x3e0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 write_commit_callback+0x5f/0x1a0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 osc_io_commit_async+0x226/0x530 [osc 0cd30f43a98bab30cdcc8c80790581cd345e8072]
 ? vvp_set_pagevec_dirty+0x3e0/0x3e0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 ? vvp_set_pagevec_dirty+0x3e0/0x3e0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 cl_io_commit_async+0x8b/0x160 [obdclass 627f410ec5b64ecc7835c12c3881f5ffa2886afa]
 lov_io_commit_async+0x101/0x5a0 [lov 85fdc8bde1ce6ed86b2cd3053a19a75843ff306a]
 ? vvp_set_pagevec_dirty+0x3e0/0x3e0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 ? vvp_set_pagevec_dirty+0x3e0/0x3e0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 cl_io_commit_async+0x8b/0x160 [obdclass 627f410ec5b64ecc7835c12c3881f5ffa2886afa]
 vvp_io_write_commit+0x151/0x5f0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 vvp_io_write_start+0x8c4/0xc60 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 cl_io_start+0x6c/0x130 [obdclass 627f410ec5b64ecc7835c12c3881f5ffa2886afa]
 cl_io_loop+0x9a/0x200 [obdclass 627f410ec5b64ecc7835c12c3881f5ffa2886afa]
 ll_file_io_generic+0x423/0xc90 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 ll_file_write_iter+0x3f2/0x7b0 [lustre 0967379a0b23e963dac3d44d0227623bfa058caa]
 new_sync_write+0x11f/0x1b0
 vfs_write+0x21c/0x280
 ksys_write+0xa1/0xe0
 do_syscall_64+0x5b/0x80
 ? ksys_write+0x50/0xe0 
 ? do_syscall_64+0x67/0x80
 ? do_sys_open+0x57/0x80
 ? syscall_exit_to_user_mode+0x18/0x40
 ? do_syscall_64+0x67/0x80
 ? exc_page_fault+0x67/0x150
 entry_SYSCALL_64_after_hwframe+0x44/0xae
RIP: 0033:0x7f1eae65db13
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.whamcloud.com/test_sets/227e0686-d7d7-4e4a-9d0b-cdaf599ee00e&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/227e0686-d7d7-4e4a-9d0b-cdaf599ee00e&lt;/a&gt;&lt;/p&gt;</description>
                <environment>SLES15 SP4 client</environment>
        <key id="71156">LU-16013</key>
            <summary>SLES15 SP4 client BUG: kernel NULL pointer dereference</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="paf0186">Patrick Farrell</assignee>
                                    <reporter username="yujian">Jian Yu</reporter>
                        <labels>
                    </labels>
                <created>Thu, 14 Jul 2022 22:52:46 +0000</created>
                <updated>Sat, 13 Aug 2022 02:50:07 +0000</updated>
                            <resolved>Wed, 10 Aug 2022 17:48:05 +0000</resolved>
                                    <version>Lustre 2.15.1</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="340472" author="yujian" created="Thu, 14 Jul 2022 22:56:53 +0000"  >&lt;p&gt;Hi Patrick,&lt;br/&gt;
Could you please advise? Is this related to the changes in &lt;a href=&quot;https://review.whamcloud.com/45927&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45927&lt;/a&gt; (&quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15220&quot; title=&quot;Linux kernel 5.14 support&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15220&quot;&gt;&lt;del&gt;LU-15220&lt;/del&gt;&lt;/a&gt; llite: Compat for set_pagevec_dirty&quot;)?&lt;/p&gt;</comment>
                            <comment id="340473" author="yujian" created="Thu, 14 Jul 2022 23:13:20 +0000"  >&lt;p&gt;FYI, sanity test 0d passed on RHEL 9.0 client with kernel 5.14.0-70.17.1.el9_0.x86_64:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;== sanity test 0d: check export proc ======================================================================================= 16:08:16 (1657840096)
mgc.MGC192.168.0.166@tcp.import=
import:
    name: MGC192.168.0.166@tcp
    target: MGS
    state: FULL
    connect_flags: [ version, barrier, adaptive_timeouts, full20, imp_recov, bulk_mbits, second_flags, reply_mbits ]
    connect_data:
       flags: 0xa000011001002020
       instance: 0
       target_version: 2.15.0.0
    import_flags: [ pingable, connect_tried ]
    connection:
       failover_nids: [ 192.168.0.166@tcp ]
       current_connection: 192.168.0.166@tcp
       connection_attempts: 1
       generation: 1
       in-progress_invalidations: 0
       idle: 5 sec
CMD: vm86 /usr/sbin/lctl get_param -N mgs.MGS.exports.*
CMD: vm86 /usr/sbin/lctl get_param -n mgs.MGS.exports.0@lo.uuid
CMD: vm86 /usr/sbin/lctl get_param -n mgs.MGS.exports.192.168.0.153@tcp.uuid
CMD: vm86 /usr/sbin/lctl get_param mgs.MGS.exports.192.168.0.153@tcp.export
mgs.MGS.exports.192.168.0.153@tcp.export=
eb8166ca-446d-425a-8c5e-04d8d30b3c77:
    name: MGS
    client: 192.168.0.153@tcp
    connect_flags: [ version, barrier, adaptive_timeouts, full20, imp_recov, bulk_mbits, second_flags, reply_mbits ]
    connect_data:
       flags: 0xa000011001002020
       instance: 0
       target_version: 2.15.0.0
    export_flags: [  ]
CMD: vm90 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null
PASS 0d (3s)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="341477" author="paf0186" created="Mon, 25 Jul 2022 16:57:53 +0000"  >&lt;p&gt;Jian,&lt;/p&gt;

&lt;p&gt;Are you able to look at the dump and extract the line of code where the null pointer occurred?&#160; And, also - Does that SLES result in HAVE_KALLSYMS_LOOKUP_NAME defined, or not?&lt;/p&gt;

&lt;p&gt;There&apos;s nothing obviously wrong with the patch, but I don&apos;t immediately know what code is running there either.&lt;/p&gt;</comment>
                            <comment id="341479" author="paf0186" created="Mon, 25 Jul 2022 17:02:07 +0000"  >&lt;p&gt;See comment here for possible thoughts:&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/#/c/45927/6/lustre/llite/vvp_dev.c@292&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/45927/6/lustre/llite/vvp_dev.c@292&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="341544" author="yujian" created="Tue, 26 Jul 2022 06:43:53 +0000"  >&lt;p&gt;Thank you for the advice, Patrick. The failure occurred in an autotest run. Let me reproduce it in a manual run and debug the code.&lt;/p&gt;</comment>
                            <comment id="342665" author="yujian" created="Fri, 5 Aug 2022 08:10:46 +0000"  >&lt;p&gt;In kernel 5.14.21-150400.22, kallsyms_lookup_name is defined but account_page_dirtied is not exported:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeHeader panelHeader&quot; style=&quot;border-bottom-width: 1px;&quot;&gt;&lt;b&gt;mm/page-writeback.c&lt;/b&gt;&lt;/div&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
/*
 * Helper function &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; set_page_dirty family.
 *
 * Caller must hold lock_page_memcg().
 *
 * NOTE: This relies on being atomic wrt interrupts.
 */
&lt;span class=&quot;code-keyword&quot;&gt;static&lt;/span&gt; void account_page_dirtied(struct page *page,
                struct address_space *mapping)
{
        struct inode *inode = mapping-&amp;gt;host;

        trace_writeback_dirty_page(page, mapping);

        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (mapping_can_writeback(mapping)) {
                struct bdi_writeback *wb;

                inode_attach_wb(inode, page);
                wb = inode_to_wb(inode);

                __inc_lruvec_page_state(page, NR_FILE_DIRTY);
                __inc_zone_page_state(page, NR_ZONE_WRITE_PENDING);
                __inc_node_page_state(page, NR_DIRTIED);
                inc_wb_stat(wb, WB_RECLAIMABLE);
                inc_wb_stat(wb, WB_DIRTIED);
                task_io_account_write(PAGE_SIZE);
                current-&amp;gt;nr_dirtied++;
                __this_cpu_inc(bdp_ratelimits);

                mem_cgroup_track_foreign_dirty(page, wb);
        }
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="342799" author="yujian" created="Fri, 5 Aug 2022 21:30:21 +0000"  >&lt;p&gt;After falling back to __set_page_dirty_nobuffers() when account_page_dirtied() is not found, sanity test 0d passed. I&apos;m creating the patch.&lt;/p&gt;</comment>
                            <comment id="343263" author="pjones" created="Wed, 10 Aug 2022 17:48:05 +0000"  >&lt;p&gt;Fix included in latest &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15959&quot; title=&quot;support for SLES 15 SP4&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15959&quot;&gt;&lt;del&gt;LU-15959&lt;/del&gt;&lt;/a&gt;&#160;patch&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10120">
                    <name>Blocker</name>
                                            <outwardlinks description="is blocking">
                                        <issuelink>
            <issuekey id="70806">LU-15959</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="67158">LU-15220</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i02unb:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>