<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:09:26 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14402] LBUG: osd_write_commit() ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed</title>
                <link>https://jira.whamcloud.com/browse/LU-14402</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 6733.016726] perf: interrupt took too long (3163 &amp;gt; 3126), lowering kernel.perf_event_max_sample_rate to 63000
[ 6953.568157] LustreError: 29459:0:(osd_io.c:1558:osd_write_commit()) ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed: 
[ 6953.579769] LustreError: 29459:0:(osd_io.c:1558:osd_write_commit()) LBUG
[ 6953.587203] Pid: 29459, comm: ll_ost_io00_523 3.10.0-957.1.3957.1.3.x3.4.37.x86_64 #1 SMP Mon Jan 13 18:26:28 PST 2020
[ 6953.598541] Call Trace:
[ 6953.601529]  [&amp;lt;ffffffffc11e862c&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[ 6953.608765]  [&amp;lt;ffffffffc11e894c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[ 6953.615539]  [&amp;lt;ffffffffc1dffcac&amp;gt;] osd_write_commit+0x52c/0x870 [osd_ldiskfs]
[ 6953.623529]  [&amp;lt;ffffffffc1c24769&amp;gt;] ofd_commitrw_write+0xde9/0x1480 [ofd]
[ 6953.630806]  [&amp;lt;ffffffffc1c2861d&amp;gt;] ofd_commitrw+0x2ad/0x9a0 [ofd]
[ 6953.637512]  [&amp;lt;ffffffffc171dac9&amp;gt;] tgt_brw_write+0xfd9/0x1cc0 [ptlrpc]
[ 6953.644747]  [&amp;lt;ffffffffc1719c4a&amp;gt;] tgt_request_handle+0x7ea/0x1750 [ptlrpc]
[ 6953.652474]  [&amp;lt;ffffffffc16bd136&amp;gt;] ptlrpc_server_handle_request+0x256/0xb10 [ptlrpc]
[ 6953.661074]  [&amp;lt;ffffffffc16c1c8c&amp;gt;] ptlrpc_main+0xb3c/0x14e0 [ptlrpc]
[ 6953.668522]  [&amp;lt;ffffffffba6c1c31&amp;gt;] kthread+0xd1/0xe0
[ 6953.674378]  [&amp;lt;ffffffffbad76c1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[ 6953.681517]  [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
[ 6953.687422] Kernel panic - not syncing: LBUG
[ 6953.692298] CPU: 11 PID: 29459 Comm: ll_ost_io00_523 Kdump: loaded Tainted: P           OE  ------------   3.10.0-957.1.3957.1.3.x3.4.37.x86_64 #1
[ 6953.706675] Hardware name: Seagate Laguna Seca/Laguna Seca, BIOS v02.0040 06/29/2018
[ 6953.715123] Call Trace:
[ 6953.718301]  [&amp;lt;ffffffffbad63e41&amp;gt;] dump_stack+0x19/0x1b
[ 6953.724122]  [&amp;lt;ffffffffbad5d550&amp;gt;] panic+0xe8/0x21f
[ 6953.729700]  [&amp;lt;ffffffffc11e899b&amp;gt;] lbug_with_loc+0x9b/0xa0 [libcfs]
[ 6953.736628]  [&amp;lt;ffffffffc1dffcac&amp;gt;] osd_write_commit+0x52c/0x870 [osd_ldiskfs]
[ 6953.744395]  [&amp;lt;ffffffffc1c24769&amp;gt;] ofd_commitrw_write+0xde9/0x1480 [ofd]
[ 6953.751678]  [&amp;lt;ffffffffc1c2861d&amp;gt;] ofd_commitrw+0x2ad/0x9a0 [ofd]
[ 6953.758374]  [&amp;lt;ffffffffc171dac9&amp;gt;] tgt_brw_write+0xfd9/0x1cc0 [ptlrpc]
[ 6953.765463]  [&amp;lt;ffffffffba6db748&amp;gt;] ? __enqueue_entity+0x78/0x80
[ 6953.771941]  [&amp;lt;ffffffffba6e236f&amp;gt;] ? enqueue_entity+0x2ef/0xbe0
[ 6953.778575]  [&amp;lt;ffffffffc16d6d97&amp;gt;] ? __req_capsule_get+0x427/0x6b0 [ptlrpc]
[ 6953.786210]  [&amp;lt;ffffffffc1719c4a&amp;gt;] tgt_request_handle+0x7ea/0x1750 [ptlrpc]
[ 6953.793817]  [&amp;lt;ffffffffc16f3bc1&amp;gt;] ? ptlrpc_nrs_req_get_nolock0+0xd1/0x170 [ptlrpc]
[ 6953.802150]  [&amp;lt;ffffffffc11e502e&amp;gt;] ? ktime_get_real_seconds+0xe/0x10 [libcfs]
[ 6953.809942]  [&amp;lt;ffffffffc16bd136&amp;gt;] ptlrpc_server_handle_request+0x256/0xb10 [ptlrpc]
[ 6953.818313]  [&amp;lt;ffffffffba6cec64&amp;gt;] ? __wake_up+0x44/0x50
[ 6953.824396]  [&amp;lt;ffffffffc16c1c8c&amp;gt;] ptlrpc_main+0xb3c/0x14e0 [ptlrpc]
[ 6953.831440]  [&amp;lt;ffffffffc16c1150&amp;gt;] ? ptlrpc_register_service+0xf90/0xf90 [ptlrpc]
[ 6953.839649]  [&amp;lt;ffffffffba6c1c31&amp;gt;] kthread+0xd1/0xe0
[ 6953.845394]  [&amp;lt;ffffffffba6c1b60&amp;gt;] ? insert_kthread_work+0x40/0x40
[ 6953.852303]  [&amp;lt;ffffffffbad76c1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[ 6953.859587]  [&amp;lt;ffffffffba6c1b60&amp;gt;] ? insert_kthread_work+0x40/0x40
(END)

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="62700">LU-14402</key>
            <summary>LBUG: osd_write_commit() ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="stancheff">Shaun Tancheff</reporter>
                        <labels>
                    </labels>
                <created>Thu, 4 Feb 2021 13:18:34 +0000</created>
                <updated>Sat, 23 Oct 2021 01:34:09 +0000</updated>
                            <resolved>Sat, 23 Oct 2021 01:34:09 +0000</resolved>
                                    <version>Lustre 2.14.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="313371" author="stancheff" created="Sun, 19 Sep 2021 14:37:30 +0000"  >&lt;p&gt;As of:  v2_14_54-52-g1887169365&lt;/p&gt;

&lt;p&gt;I am still hitting this LBUG.&lt;/p&gt;

&lt;p&gt;Ex:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Sep 19 09:21:52 snx11922n005 kernel: LustreError: 24267:0:(osd_io.c:1608:osd_write_commit()) ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed: 
Sep 19 09:21:52 snx11922n005 kernel: LustreError: 24267:0:(osd_io.c:1608:osd_write_commit()) LBUG
Sep 19 09:21:52 snx11922n005 kernel: Pid: 24267, comm: ll_ost_io00_713 3.10.0-957.1.3957.1.3.x3.4.37.x86_64 #1 SMP Mon Jan 13 18:26:28 PST 2020
Sep 19 09:21:52 snx11922n005 kernel: IEC: 026000003: LASSERT: { &quot;pid&quot;: &quot;24267&quot;, &quot;ext_pid&quot;: &quot;0&quot;, &quot;filename&quot;: &quot;osd_io.c&quot;, &quot;line&quot;: &quot;1608&quot;, &quot;func_name&quot;: &quot;osd_write_commit&quot;, &quot;assert_info&quot;: &quot;( !PageDirty(lnb[i].lnb_page) ) failed: &quot; }
Sep 19 09:21:52 snx11922n005 kernel: IEC: 026000004: LBUG: { &quot;pid&quot;: &quot;24267&quot;, &quot;ext_pid&quot;: &quot;0&quot;, &quot;filename&quot;: &quot;osd_io.c&quot;, &quot;line&quot;: &quot;1608&quot;, &quot;func_name&quot;: &quot;osd_write_commit&quot; }
Sep 19 09:21:52 snx11922n005 kernel: Call Trace:
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] libcfs_call_trace+0x90/0xf0 [libcfs]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] osd_write_commit+0x52c/0x880 [osd_ldiskfs]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] ofd_commitrw_write+0xef9/0x15d0 [ofd]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] ofd_commitrw+0x335/0x9f0 [ofd]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] tgt_brw_write+0x176a/0x2310 [ptlrpc]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] tgt_request_handle+0x823/0x1850 [ptlrpc]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] ptlrpc_server_handle_request+0x253/0xb10 [ptlrpc]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] ptlrpc_main+0xbf4/0x15e0 [ptlrpc]
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] kthread+0xd1/0xe0
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
Sep 19 09:21:52 snx11922n005 kernel: [&amp;lt;0&amp;gt;] 0xfffffffffffffffe
Sep 19 09:21:52 snx11922n005 kernel: Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Also kindly note that this includes the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14640&quot; title=&quot;ASSERTION( !PageDirty(lnb[i].lnb_page) in osd_write_commit()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14640&quot;&gt;&lt;del&gt;LU-14640&lt;/del&gt;&lt;/a&gt; fix &lt;a href=&quot;https://review.whamcloud.com/#/c/43462/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/43462/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="314260" author="gerrit" created="Wed, 29 Sep 2021 09:58:43 +0000"  >&lt;p&gt;&quot;Shaun Tancheff &amp;lt;shaun.tancheff@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/45086&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45086&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14402&quot; title=&quot;LBUG: osd_write_commit() ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14402&quot;&gt;&lt;del&gt;LU-14402&lt;/del&gt;&lt;/a&gt; osd-ldiskfs: Page cache pages dirtied in writeback&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 3d35690a18d558be68e1701c71f9f02901125cf8&lt;/p&gt;</comment>
                            <comment id="314261" author="gerrit" created="Wed, 29 Sep 2021 09:58:44 +0000"  >&lt;p&gt;&quot;Shaun Tancheff &amp;lt;shaun.tancheff@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/45087&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45087&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14402&quot; title=&quot;LBUG: osd_write_commit() ASSERTION( !PageDirty(lnb[i].lnb_page) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14402&quot;&gt;&lt;del&gt;LU-14402&lt;/del&gt;&lt;/a&gt; osd-ldiskfs: disable pagecache bypass feature&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 060e753054494e44eb15bef9695d9038ba834a4e&lt;/p&gt;</comment>
                            <comment id="314339" author="adilger" created="Wed, 29 Sep 2021 20:49:06 +0000"  >&lt;p&gt;&lt;del&gt;Shaun, this same &lt;tt&gt;ASSERTION()&lt;/tt&gt; was reported fixed via patch &lt;a href=&quot;https://review.whamcloud.com/43462&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43462&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14640&quot; title=&quot;ASSERTION( !PageDirty(lnb[i].lnb_page) in osd_write_commit()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14640&quot;&gt;&lt;del&gt;LU-14640&lt;/del&gt;&lt;/a&gt; osd: ASSERTION(!PageDirty(lnb&lt;span class=&quot;error&quot;&gt;&amp;#91;i&amp;#93;&lt;/span&gt;.lnb_page)&lt;/tt&gt;&quot;.&lt;/del&gt;&lt;/p&gt;

&lt;p&gt;&lt;del&gt;The problem wasn&apos;t so much the uncached IO patches that you are reverting as that &lt;tt&gt;fallocate()&lt;/tt&gt; wasn&apos;t cleaning up partially-zeroed pages in the cache.&lt;/del&gt;&lt;/p&gt;

&lt;p&gt;Ah, I see your addendum that this patch is included in your recent failure.  Do you have any details of your workload that is triggering this error?  We&apos;ve been running with the uncached IO patches for many months without any similar reports in the field, so there must be something specific in your workload that is triggering it.&lt;/p&gt;</comment>
                            <comment id="314448" author="stancheff" created="Thu, 30 Sep 2021 19:19:54 +0000"  >&lt;p&gt;The crash hits quite early (30 minutes or so) in our io-stress suite. The suite is large with bits of unaligned I/O mixed in doing the usual aio/dio, mmap, ior, and ltp tests.&lt;/p&gt;
</comment>
                            <comment id="316372" author="stancheff" created="Fri, 22 Oct 2021 18:24:25 +0000"  >&lt;p&gt;As of 14d07b6237 this did not reproduce.&lt;/p&gt;</comment>
                            <comment id="316415" author="adilger" created="Sat, 23 Oct 2021 01:34:09 +0000"  >&lt;p&gt;The range v2_14_55-52..14d07b6237 contains 87 patches, but if this is restricted to changes to &lt;tt&gt;lustre/osd-ldiskfs&lt;/tt&gt; and &lt;tt&gt;lustre/ofd&lt;/tt&gt; the list is more manageable:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[root@centos7 lustre-copy]# git log --oneline v2_14_55~$((98-52))..14d07b6237 lustre/osd-ldiskfs  lustre/ofd
5daf86607877 LU-12268 osd: BUG_ON for IAM corruption
882a9f784de2 LU-14927 scrub: create shared scrub_needs_check() function.
0daeebcbdc4e LU-14797 nodemap: map project id
bbfdc7c1670c LU-14739 quota: fix quota with root squash enabled
bb5d81ea9550 LU-14543 target: prevent overflowing of tgd-&amp;gt;tgd_tot_granted
da1d93513fdf LU-14475 log: Rewrite some log messages
2a24b6ec67da LU-14734 ldiskfs: improve message for large_dir
7fdd664b3518 LU-14895 osd-ldiskfs: combine checksum functions
c18d5d892b62 LU-14889 lproc: Add server checksum_type
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;The patch &lt;a href=&quot;https://review.whamcloud.com/45072&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45072&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12268&quot; title=&quot;LDISKFS-fs error: ldiskfs_find_dest_de:2066: bad entry in directory: rec_len is smaller than minimal - offset=0( 0), inode=201, rec_len=0, name_len=0&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12268&quot;&gt;&lt;del&gt;LU-12268&lt;/del&gt;&lt;/a&gt; osd: BUG_ON for IAM corruption&lt;/tt&gt;&quot; might &quot;prevent&quot; memory corruption in some cases, but it would trigger &lt;tt&gt;BUG_ON()&lt;/tt&gt; instead, because the patch doesn&apos;t actually fix the core problem.&lt;/p&gt;

&lt;p&gt;Other than that, I don&apos;t really have any concrete suggestions other than to try bisect, if you want to figure out which patch fixed the problem.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="63928">LU-14640</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01liv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>