<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:08:47 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14326] sanity-dom test_fsx: crash in osc_extent_make_ready()</title>
                <link>https://jira.whamcloud.com/browse/LU-14326</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Andreas Dilger  &amp;lt;adilger@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/393c6362-298e-472f-be95-f23a1892e9df&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/393c6362-298e-472f-be95-f23a1892e9df&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_fsx failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;trevis-209vm6 crashed during sanity-dom test_fsx

[14491.172043] LustreError: 813:0:(osc_cache.c:1113:osc_extent_make_ready()) ASSERTION( last_oap_count &amp;gt; 0 ) failed: 
[14491.173797] LustreError: 813:0:(osc_cache.c:1113:osc_extent_make_ready()) LBUG
[14491.174924] Pid: 813, comm: ldlm_bl_06 3.10.0-1127.19.1.el7.x86_64 #1 SMP Tue Aug 25 17:23:54 UTC 2020
[14491.176409] Call Trace:
[14491.176839]  [&amp;lt;ffffffffc06e867c&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[14491.177945]  [&amp;lt;ffffffffc06e899c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[14491.178941]  [&amp;lt;ffffffffc0cdf284&amp;gt;] osc_extent_make_ready+0xb64/0xe50 [osc]
[14491.180097]  [&amp;lt;ffffffffc0ce228b&amp;gt;] osc_io_unplug0+0xeeb/0x1900 [osc]
[14491.181117]  [&amp;lt;ffffffffc0ce6930&amp;gt;] osc_cache_writeback_range+0x9a0/0xfd0 [osc]
[14491.182254]  [&amp;lt;ffffffffc0cd1925&amp;gt;] osc_lock_flush+0x195/0x290 [osc]
[14491.183251]  [&amp;lt;ffffffffc0cd1df8&amp;gt;] osc_ldlm_blocking_ast+0x2f8/0x3e0 [osc]
[14491.184337]  [&amp;lt;ffffffffc0ac713a&amp;gt;] ldlm_cancel_callback+0x8a/0x310 [ptlrpc]
[14491.185607]  [&amp;lt;ffffffffc0ad2dd1&amp;gt;] ldlm_cli_cancel_local+0xd1/0x420 [ptlrpc]
[14491.186747]  [&amp;lt;ffffffffc0ad8fec&amp;gt;] ldlm_cli_cancel+0x10c/0x550 [ptlrpc]
[14491.187822]  [&amp;lt;ffffffffc0cd1c7a&amp;gt;] osc_ldlm_blocking_ast+0x17a/0x3e0 [osc]
[14491.189143]  [&amp;lt;ffffffffc0add6e8&amp;gt;] ldlm_handle_bl_callback+0xc8/0x3e0 [ptlrpc]
[14491.190361]  [&amp;lt;ffffffffc0addf9f&amp;gt;] ldlm_bl_thread_main+0x59f/0xaa0 [ptlrpc]
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;





&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
sanity-dom test_fsx - trevis-209vm6 crashed during sanity-dom test_fsx&lt;/p&gt;</description>
                <environment></environment>
        <key id="62314">LU-14326</key>
            <summary>sanity-dom test_fsx: crash in osc_extent_make_ready()</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Tue, 12 Jan 2021 06:04:44 +0000</created>
                <updated>Sat, 23 Jan 2021 10:31:51 +0000</updated>
                            <resolved>Fri, 22 Jan 2021 20:58:37 +0000</resolved>
                                    <version>Lustre 2.14.0</version>
                                    <fixVersion>Lustre 2.14.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="289334" author="jhammond" created="Tue, 12 Jan 2021 21:38:47 +0000"  >&lt;p&gt;This assertion can be reproduced outside of sanity-dom:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;${LUSTRE}/tests/llmount.sh
touch /mnt/lustre/f0
fsx -c 50 -p 100 -N 1000 -l 1048576 -S 0 -d -d /mnt/lustre/f0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;On my system it takes fewer than ~5 runs of fsx.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 1456.917867] LustreError: 6997:0:(osc_cache.c:1113:osc_extent_make_ready()) ASSERTION( last_oap_count &amp;gt; 0 ) failed: 
[ 1456.920595] LustreError: 6997:0:(osc_cache.c:1113:osc_extent_make_ready()) LBUG
[ 1456.922471] Pid: 6997, comm: fsx 3.10.0-1062.9.1.el7.x86_64.debug #1 SMP Mon Mar 16 12:44:56 CDT 2020
[ 1456.924801] Call Trace:
[ 1456.925471]  [&amp;lt;ffffffffc06c2d4c&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[ 1456.927163]  [&amp;lt;ffffffffc06c306c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[ 1456.928725]  [&amp;lt;ffffffffc0e025e4&amp;gt;] osc_extent_make_ready+0xb64/0xe50 [osc]
[ 1456.930547]  [&amp;lt;ffffffffc0e05603&amp;gt;] osc_io_unplug0+0xee3/0x1910 [osc]
[ 1456.932230]  [&amp;lt;ffffffffc0e09d10&amp;gt;] osc_cache_writeback_range+0x9a0/0xfd0 [osc]
[ 1456.934128]  [&amp;lt;ffffffffc0df8745&amp;gt;] osc_io_fsync_start+0x85/0x1a0 [osc]
[ 1456.935852]  [&amp;lt;ffffffffc08efa10&amp;gt;] cl_io_start+0x70/0x140 [obdclass]
[ 1456.937585]  [&amp;lt;ffffffffc0e49e67&amp;gt;] lov_io_call.isra.7+0x87/0x140 [lov]
[ 1456.939251]  [&amp;lt;ffffffffc0e4a026&amp;gt;] lov_io_start+0x56/0x150 [lov]
[ 1456.940703]  [&amp;lt;ffffffffc08efa10&amp;gt;] cl_io_start+0x70/0x140 [obdclass]
[ 1456.942419]  [&amp;lt;ffffffffc08f1eff&amp;gt;] cl_io_loop+0x9f/0x200 [obdclass]
[ 1456.943941]  [&amp;lt;ffffffffc14bd10b&amp;gt;] cl_sync_file_range+0x2db/0x380 [lustre]
[ 1456.945905]  [&amp;lt;ffffffffc14e081a&amp;gt;] ll_writepages+0x7a/0x200 [lustre]
[ 1456.947975]  [&amp;lt;ffffffffa1215b04&amp;gt;] do_writepages+0x24/0x50
[ 1456.949314]  [&amp;lt;ffffffffa1207e35&amp;gt;] __filemap_fdatawrite_range+0x65/0x80
[ 1456.950776]  [&amp;lt;ffffffffa1207f94&amp;gt;] filemap_write_and_wait_range+0x44/0x90
[ 1456.952472]  [&amp;lt;ffffffffc14bd240&amp;gt;] ll_fsync+0x90/0x540 [lustre]
[ 1456.953904]  [&amp;lt;ffffffffa12e5770&amp;gt;] vfs_fsync_range+0x20/0x30
[ 1456.955335]  [&amp;lt;ffffffffa124e18e&amp;gt;] SyS_msync+0x1fe/0x250
[ 1456.962318]  [&amp;lt;ffffffffa1887d4a&amp;gt;] tracesys+0xa6/0xcc
[ 1456.963771]  [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
[ 1456.965134] Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="289453" author="adilger" created="Thu, 14 Jan 2021 03:12:23 +0000"  >&lt;p&gt;Bobijam, could you please take a look.  This is being hit pretty regularly since &lt;tt&gt;fallocate()&lt;/tt&gt; checking has been fixed in the client, and &lt;tt&gt;fsx&lt;/tt&gt; is now properly testing that functionality.&lt;/p&gt;

&lt;p&gt;Is it possible that this LASSERT() is just wrong for &lt;tt&gt;fallocate()&lt;/tt&gt; when there are no data pages being sent in the RPC?&lt;/p&gt;</comment>
                            <comment id="289454" author="adilger" created="Thu, 14 Jan 2021 03:15:58 +0000"  >&lt;p&gt;It looks like there was a patch &lt;a href=&quot;https://review.whamcloud.com/30848&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/30848&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10407&quot; title=&quot;osc_cache.c:1141:osc_extent_make_ready()) ASSERTION( last_oap_count &amp;gt; 0 ) failed: &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10407&quot;&gt;&lt;del&gt;LU-10407&lt;/del&gt;&lt;/a&gt; osc: update size before queue page&lt;/tt&gt;&quot; pushed a couple of years ago and never landed, due to Jinshan giving it a -1.  That might give some ideas where to start.&lt;/p&gt;</comment>
                            <comment id="289482" author="green" created="Thu, 14 Jan 2021 15:25:26 +0000"  >&lt;p&gt;This is a major source of sanity-benchmark crashes (in fsx) for me.&lt;/p&gt;</comment>
                            <comment id="289485" author="green" created="Thu, 14 Jan 2021 15:38:27 +0000"  >&lt;p&gt;I just also filed &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14333&quot; title=&quot;ASSERTION( oinfo-&amp;gt;loi_lvb.lvb_size &amp;gt;= oinfo-&amp;gt;loi_kms ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14333&quot;&gt;&lt;del&gt;LU-14333&lt;/del&gt;&lt;/a&gt; that seems to be related, it hits if this one did not hit, at a later point in time in cleanup.&lt;/p&gt;</comment>
                            <comment id="289545" author="adilger" created="Thu, 14 Jan 2021 22:36:06 +0000"  >&lt;p&gt;Oleg reports that the 30848 patch does not solve the fsx test issues being seen.&lt;/p&gt;</comment>
                            <comment id="289558" author="bobijam" created="Fri, 15 Jan 2021 04:22:46 +0000"  >&lt;p&gt;My test shows that #30848 only reduced the hit probability, and I got one hit that may shed some light.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;000814 1610683006.953568 write      0x09385c thru 0x098924	(0x0550c9 bytes)
000817 1610683006.954846 fallocate  0x092fd1 thru 0x09bfb3	(0x058fe3 bytes)&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Then the issue got hit, and some debug info shows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 1361.292883] LustreError: 16917:0:(osc_cache.c:1287:osc_refresh_count()) kms 602065(0x92fd1) page offset 622592(0x98000)
[ 1361.293036] LustreError: 16917:0:(osc_cache.c:1113:osc_extent_make_ready()) ASSERTION( last_oap_count &amp;gt; 0 ) failed: last_oap_count 0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;The file&apos;s kms and the fallocate offset coincide (0x092fd1); the last sync page looks to be from the write (0x98000 -&amp;gt; 0x98924).&lt;/p&gt;</comment>
                            <comment id="289561" author="gerrit" created="Fri, 15 Jan 2021 06:06:22 +0000"  >&lt;p&gt;&lt;del&gt;Bobi Jam (bobijam@hotmail.com) uploaded a new patch:&lt;/del&gt; &lt;a href=&quot;https://review.whamcloud.com/41233&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/41233&lt;/a&gt;&lt;br/&gt;
&lt;del&gt;Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14326&quot; title=&quot;sanity-dom test_fsx: crash in osc_extent_make_ready()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14326&quot;&gt;&lt;del&gt;LU-14326&lt;/del&gt;&lt;/a&gt; osc: correctly update size/kms for fallocate&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Project: fs/lustre-release&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Branch: master&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Current Patch Set: 3&lt;/del&gt;&lt;br/&gt;
&lt;del&gt;Commit: a202c4dbbd8dc6f763b6672a9fe604a9179f209a&lt;/del&gt;&lt;/p&gt;</comment>
                            <comment id="289562" author="bobijam" created="Fri, 15 Jan 2021 06:08:25 +0000"  >&lt;p&gt;Ran the fsx test for 1000 times with the patch, no LBUG happened again.&#160;&lt;/p&gt;</comment>
                            <comment id="289567" author="green" created="Fri, 15 Jan 2021 08:24:11 +0000"  >&lt;p&gt;please see my comment in the gerrit. it shifted failures to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14333&quot; title=&quot;ASSERTION( oinfo-&amp;gt;loi_lvb.lvb_size &amp;gt;= oinfo-&amp;gt;loi_kms ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14333&quot;&gt;&lt;del&gt;LU-14333&lt;/del&gt;&lt;/a&gt; style crashes and also now sanityn fsx tests in test_16&lt;span class=&quot;error&quot;&gt;&amp;#91;abc&amp;#93;&lt;/span&gt; are 100% failure because fsx sees wrong size.&lt;/p&gt;</comment>
                            <comment id="289638" author="bobijam" created="Fri, 15 Jan 2021 18:54:49 +0000"  >&lt;p&gt;I think the patch set 3 is a correct fix.&lt;/p&gt;</comment>
                            <comment id="289657" author="simmonsja" created="Fri, 15 Jan 2021 22:13:47 +0000"  >&lt;p&gt;I don&apos;t think this is a fallocate issue. This problem has been around a long time. It&apos;s just that fallocate really exposes this problem.&lt;/p&gt;</comment>
                            <comment id="289887" author="gerrit" created="Wed, 20 Jan 2021 02:03:21 +0000"  >&lt;p&gt;Bobi Jam (bobijam@hotmail.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/41272&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/41272&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14326&quot; title=&quot;sanity-dom test_fsx: crash in osc_extent_make_ready()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14326&quot;&gt;&lt;del&gt;LU-14326&lt;/del&gt;&lt;/a&gt; osc: correctly update size/kms for fallocate&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 114140000a298b9ee0e774fc1785fed034961afb&lt;/p&gt;</comment>
                            <comment id="290172" author="gerrit" created="Fri, 22 Jan 2021 20:31:40 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/41272/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/41272/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14326&quot; title=&quot;sanity-dom test_fsx: crash in osc_extent_make_ready()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14326&quot;&gt;&lt;del&gt;LU-14326&lt;/del&gt;&lt;/a&gt; osc: correctly update size/kms for fallocate&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 43979e4e257e78d3d94ea3f21b65fdebbbdc690f&lt;/p&gt;</comment>
                            <comment id="290179" author="pjones" created="Fri, 22 Jan 2021 20:58:37 +0000"  >&lt;p&gt;Landed for 2.14&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="53481">LU-11463</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="62190">LU-14286</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="62343">LU-14333</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="49916">LU-10407</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01j5j:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>