<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:29:54 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-9857] sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &lt;= end )</title>
                <link>https://jira.whamcloud.com/browse/LU-9857</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Jinshan Xiong &amp;lt;jinshan.xiong@intel.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/5ab79694-7d98-11e7-9e43-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/5ab79694-7d98-11e7-9e43-5254006e85c2&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_35 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;test failed to respond and timed out
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Please provide additional information about the failure here.&lt;/p&gt;

&lt;p&gt;Info required for matching: sanityn 35&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;23:46:36:[ 7850.159072] LustreError: 29261:0:(libcfs_fail.h:165:cfs_race()) cfs_race id 318 sleeping
23:46:36:[ 7850.166021] LustreError: 30957:0:(libcfs_fail.h:170:cfs_race()) cfs_fail_race id 318 waking
23:46:36:[ 7850.170410] LustreError: 29261:0:(libcfs_fail.h:168:cfs_race()) cfs_fail_race id 318 awake, rc=0
23:46:36:[ 7850.174782] LustreError: 29261:0:(mdc_request.c:1328:mdc_read_page()) lustre-MDT0000-mdc-ffff880067c40000: [0x200007164:0x6:0x0] lock enqueue fails: rc = -4
23:46:36:[ 7850.182752] Lustre: dir [0x2c00013a0:0xa:0x0] stripe 1 readdir failed: -4, directory is partially accessed!
23:46:36:[ 7850.191827] LustreError: 29261:0:(lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end ) failed: 
23:46:36:[ 7850.196278] LustreError: 29261:0:(lmv_obd.c:2122:stripe_dirent_next()) LBUG
23:46:36:[ 7850.199151] Pid: 29261, comm: ls
23:46:36:[ 7850.202731] 
23:46:36:[ 7850.202731] Call Trace:
23:46:36:[ 7850.209235]  [&amp;lt;ffffffffa070b7ee&amp;gt;] libcfs_call_trace+0x4e/0x60 [libcfs]
23:46:36:[ 7850.212997]  [&amp;lt;ffffffffa070b87c&amp;gt;] lbug_with_loc+0x4c/0xb0 [libcfs]
23:46:36:[ 7850.216695]  [&amp;lt;ffffffffa095f07c&amp;gt;] stripe_dirent_next+0x33c/0x922 [lmv]
23:46:36:[ 7850.220405]  [&amp;lt;ffffffffa095f8d9&amp;gt;] lmv_striped_read_page.isra.29+0x277/0x5e8 [lmv]
23:46:36:[ 7850.223563]  [&amp;lt;ffffffffa094c503&amp;gt;] lmv_read_page+0x4e3/0x550 [lmv]
23:46:36:[ 7850.226019]  [&amp;lt;ffffffffa0c2d6a8&amp;gt;] ll_get_dir_page+0xc8/0x380 [lustre]
23:46:36:[ 7850.228433]  [&amp;lt;ffffffffa0c6bf20&amp;gt;] ? ll_md_blocking_ast+0x0/0x730 [lustre]
23:46:36:[ 7850.230825]  [&amp;lt;ffffffffa0c2dc34&amp;gt;] ll_dir_read+0x214/0x320 [lustre]
23:46:36:[ 7850.233247]  [&amp;lt;ffffffff81212c00&amp;gt;] ? filldir+0x0/0xf0
23:46:36:[ 7850.235466]  [&amp;lt;ffffffff81212c00&amp;gt;] ? filldir+0x0/0xf0
23:46:36:[ 7850.237609]  [&amp;lt;ffffffffa0c2de59&amp;gt;] ll_readdir+0x119/0x4f0 [lustre]
23:46:36:[ 7850.239809]  [&amp;lt;ffffffff81212c00&amp;gt;] ? filldir+0x0/0xf0
23:46:36:[ 7850.241879]  [&amp;lt;ffffffff81212af0&amp;gt;] vfs_readdir+0xb0/0xe0
23:46:36:[ 7850.243937]  [&amp;lt;ffffffff81212f15&amp;gt;] SyS_getdents+0x95/0x120
23:46:36:[ 7850.246042]  [&amp;lt;ffffffff81697809&amp;gt;] system_call_fastpath+0x16/0x1b
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The kernel on client node crashed.&lt;/p&gt;</description>
                <environment></environment>
        <key id="47751">LU-9857</key>
            <summary>sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &lt;= end )</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Thu, 10 Aug 2017 17:59:36 +0000</created>
                <updated>Thu, 4 Jun 2020 21:40:06 +0000</updated>
                            <resolved>Sat, 12 May 2018 05:44:31 +0000</resolved>
                                    <version>Lustre 2.11.0</version>
                                    <fixVersion>Lustre 2.12.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>13</watches>
                                                                            <comments>
                            <comment id="205129" author="jay" created="Fri, 11 Aug 2017 05:17:23 +0000"  >&lt;p&gt;another occurrence: &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/01bb5028-7e45-11e7-96ed-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/01bb5028-7e45-11e7-96ed-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="205148" author="jhammond" created="Fri, 11 Aug 2017 14:14:14 +0000"  >&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/00c6ff85-4aa2-4b28-a0ae-55073c579736&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/00c6ff85-4aa2-4b28-a0ae-55073c579736&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;This assertion was added by &lt;a href=&quot;https://review.whamcloud.com/27663&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/27663&lt;/a&gt; &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-5106&quot; title=&quot;Test failure sanity test_123a: ls 10000 files is slower with statahead!&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-5106&quot;&gt;&lt;del&gt;LU-5106&lt;/del&gt;&lt;/a&gt; readdir: improve striped readdir.&lt;/p&gt;</comment>
                            <comment id="205149" author="jhammond" created="Fri, 11 Aug 2017 14:23:02 +0000"  >&lt;p&gt;Lai, I understand that this change is trying to return as many of the directory entries as possible in case of errors. But &lt;tt&gt;stripe_dirent_next()&lt;/tt&gt; must propagate errors from &lt;tt&gt;mdc_read_page()&lt;/tt&gt; up to the application. But currently it discards the return value of &lt;tt&gt;mdc_read_page()&lt;/tt&gt; and none of its callers use its own return value.&lt;/p&gt;</comment>
                            <comment id="205257" author="wangshilong" created="Sun, 13 Aug 2017 14:04:55 +0000"  >&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/ff7b28d4-8023-11e7-bbc6-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/ff7b28d4-8023-11e7-bbc6-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="205287" author="laisiyao" created="Mon, 14 Aug 2017 03:18:04 +0000"  >&lt;p&gt;I see, I&apos;ll work on it.&lt;/p&gt;</comment>
                            <comment id="205394" author="gerrit" created="Tue, 15 Aug 2017 03:22:41 +0000"  >&lt;p&gt;Lai Siyao (lai.siyao@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/28548&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/28548&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: stripe dir page may be released mistakenly&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: ff1e9e251f027c044d7853ff920dd31c4b3d1888&lt;/p&gt;</comment>
                            <comment id="205415" author="sguminsx" created="Tue, 15 Aug 2017 10:52:08 +0000"  >&lt;p&gt;Another on master:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/d7870a08-73b3-4f95-898b-f4f0908c9214&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/d7870a08-73b3-4f95-898b-f4f0908c9214&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="206563" author="gerrit" created="Mon, 28 Aug 2017 06:27:15 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/28548/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/28548/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: stripe dir page may be released mistakenly&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: beadbad429aeffa66898bd62cc99e76290644ca8&lt;/p&gt;</comment>
                            <comment id="206619" author="pjones" created="Mon, 28 Aug 2017 14:59:26 +0000"  >&lt;p&gt;Landed for 2.11&lt;/p&gt;</comment>
                            <comment id="207026" author="bzzz" created="Thu, 31 Aug 2017 04:39:55 +0000"  >&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/7fe3bcd4-8d99-11e7-b4f3-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/7fe3bcd4-8d99-11e7-b4f3-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="214978" author="yong.fan" created="Thu, 30 Nov 2017 00:06:08 +0000"  >&lt;p&gt;+1 on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/e9580a21-afc8-493a-90f6-be7f0e47bc94&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/e9580a21-afc8-493a-90f6-be7f0e47bc94&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_logs/ca1d75b8-d53f-11e7-8027-52540065bddc/show_text&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_logs/ca1d75b8-d53f-11e7-8027-52540065bddc/show_text&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="216023" author="bfaccini" created="Tue, 12 Dec 2017 08:10:01 +0000"  >&lt;p&gt;+1 on latest master : &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/8182cffe-dee7-11e7-9840-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/8182cffe-dee7-11e7-9840-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="216223" author="adilger" created="Wed, 13 Dec 2017 22:55:19 +0000"  >&lt;p&gt;Just hit this again on master, dated 2017-12-09:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/ebf98b0c-dd34-11e7-9c63-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/ebf98b0c-dd34-11e7-9c63-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="216681" author="laisiyao" created="Tue, 19 Dec 2017 02:41:21 +0000"  >&lt;p&gt;I don&apos;t see this assert in all the failures, but timeout, so I&apos;m afraid it&apos;s a different issue. And unluckily these timeout failures don&apos;t leave any logs, I&apos;ll try to reproduce it first.&lt;/p&gt;</comment>
                            <comment id="218486" author="bfaccini" created="Thu, 18 Jan 2018 08:28:15 +0000"  >&lt;p&gt;+1 with latest master at &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/e3801c38-fc16-11e7-bd00-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/e3801c38-fc16-11e7-bd00-52540065bddc&lt;/a&gt;.&lt;br/&gt;
Lai, to find the LBUG just look for sanityn/test_35 related outputs in Client&apos;s Console log.&lt;/p&gt;</comment>
                            <comment id="218718" author="yujian" created="Fri, 19 Jan 2018 23:21:58 +0000"  >&lt;p&gt;+1 on master branch:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/49b96ede-fcdd-11e7-a7cd-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/49b96ede-fcdd-11e7-a7cd-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="218782" author="yong.fan" created="Mon, 22 Jan 2018 01:50:50 +0000"  >&lt;p&gt;+1 on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/44775e1e-fe03-11e7-a10a-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/44775e1e-fe03-11e7-a10a-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="220437" author="yujian" created="Thu, 8 Feb 2018 17:22:54 +0000"  >&lt;p&gt;+1 on master branch:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/6667a692-0cd5-11e8-bd00-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/6667a692-0cd5-11e8-bd00-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="223654" author="sarah" created="Wed, 14 Mar 2018 22:13:42 +0000"  >&lt;p&gt;on master tag-2.10.59&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/38bd33e4-2786-11e8-b6a0-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/38bd33e4-2786-11e8-b6a0-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="226492" author="jamesanunez" created="Fri, 20 Apr 2018 18:08:29 +0000"  >&lt;p&gt;All recent failures look like they are for DNE configurations. Here are some recent failures with links to logs and core files:&lt;/p&gt;

&lt;p&gt;Logs at &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/614c9d28-444f-11e8-95c0-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/614c9d28-444f-11e8-95c0-52540065bddc&lt;/a&gt;&lt;br/&gt;
Core file can be found in /scratch/dumps/trevis-4vm8.trevis.hpdd.intel.com/10.9.4.36-2018-04-20-03:58:14&lt;/p&gt;

&lt;p&gt;Logs at &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/1cf4c6b6-42a9-11e8-8f8a-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/1cf4c6b6-42a9-11e8-8f8a-52540065bddc&lt;/a&gt;&lt;br/&gt;
Core file can be found in /scratch/dumps/trevis-44vm1.trevis.hpdd.intel.com/10.9.6.10-2018-04-18-01:35:14&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/1cf4c6b6-42a9-11e8-8f8a-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/1cf4c6b6-42a9-11e8-8f8a-52540065bddc&lt;/a&gt;&lt;br/&gt;
Core file can be found in /scratch/dumps/trevis-44vm1.trevis.hpdd.intel.com/10.9.6.10-2018-04-18-01:35:14&lt;/p&gt;</comment>
                            <comment id="226602" author="laisiyao" created="Tue, 24 Apr 2018 07:08:42 +0000"  >&lt;p&gt;James, the links of the 2nd and the 3rd are duplicates. And the 1st looks to be another issue:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[10146.583339] Lustre: DEBUG MARKER: == sanityn test 16a: 500 iterations of dual-mount fsx ================================================ 03:55:24 (1524196524)
[10252.159310] NMI watchdog: BUG: soft lockup - CPU#1 stuck for 23s! [ll_ost_io00_003:23498]
[10252.159310] Modules linked in: osp(OE) ofd(OE) lfsck(OE) ost(OE) mgc(OE) osd_zfs(OE) lquota(OE) fid(OE) fld(OE) ksocklnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) libcfs(OE) rpcsec_gss_krb5 nfsv4 dns_resolver nfs fscache rpcrdma ib_isert iscsi_target_mod ib_iser libiscsi scsi_transport_iscsi ib_srpt target_core_mod crc_t10dif crct10dif_generic ib_srp scsi_transport_srp scsi_tgt ib_ipoib rdma_ucm ib_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_core dm_mod zfs(POE) zunicode(POE) zavl(POE) icp(POE) iosf_mbi crc32_pclmul ghash_clmulni_intel zcommon(POE) znvpair(POE) ppdev spl(OE) aesni_intel lrw gf128mul glue_helper ablk_helper cryptd joydev virtio_balloon pcspkr i2c_piix4 parport_pc parport nfsd nfs_acl lockd grace auth_rpcgss sunrpc ip_tables ext4 mbcache jbd2 ata_generic pata_acpi ata_piix virtio_blk cirrus drm_kms_helper libata syscopyarea sysfillrect 8139too sysimgblt fb_sys_fops ttm crct10dif_pclmul crct10dif_common drm crc32c_intel serio_raw virtio_pci virtio_ring virtio 8139cp i2c_core mii floppy
[10252.159310] CPU: 1 PID: 23498 Comm: ll_ost_io00_003 Tainted: P           OE  ------------   3.10.0-693.21.1.el7_lustre.x86_64 #1
[10252.159310] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2007
[10252.159310] task: ffff880059e56eb0 ti: ffff880059538000 task.ti: ffff880059538000
[10252.159310] RIP: 0010:[&amp;lt;ffffffff81337f93&amp;gt;]  [&amp;lt;ffffffff81337f93&amp;gt;] memset+0x33/0xb0
[10252.159310] RSP: 0018:ffff88005953b820  EFLAGS: 00010212
[10252.159310] RAX: 0000000000000000 RBX: 0000000000000000 RCX: 0000000000000fbf
[10252.159310] RDX: 0000000000100000 RSI: 0000000000000000 RDI: ffffc900140ec000
[10252.159310] RBP: ffff88005953b8c0 R08: ffff880036aab690 R09: 0000000000000000
[10252.159310] R10: ffffc9001402b000 R11: ffffea000116bc00 R12: ffffffffc04a7d3b
[10252.159310] R13: ffff88005953b7b0 R14: ffff880059a5b000 R15: ffffffffc056e667
[10252.159310] FS:  0000000000000000(0000) GS:ffff88007fd00000(0000) knlGS:0000000000000000
[10252.159310] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[10252.159310] CR2: 00007fd2559ae000 CR3: 0000000079462000 CR4: 00000000000606e0
[10252.159310] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[10252.159310] DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
[10252.159310] Call Trace:
[10252.159310]  [&amp;lt;ffffffffc04b2cc7&amp;gt;] ? dbuf_read+0x397/0x9e0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc0575128&amp;gt;] ? zio_done+0x748/0xd20 [zfs]
[10252.159310]  [&amp;lt;ffffffffc056eb8c&amp;gt;] ? zio_destroy+0x7c/0x80 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04b66d9&amp;gt;] dmu_buf_will_dirty+0x119/0x130 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04bcf15&amp;gt;] dmu_write_impl+0x45/0xd0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04beb57&amp;gt;] dmu_write.part.7+0xa7/0x110 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04bed36&amp;gt;] dmu_assign_arcbuf+0x156/0x1a0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc10cfdcd&amp;gt;] osd_write_commit+0x46d/0xa00 [osd_zfs]
[10252.159310]  [&amp;lt;ffffffffc120b29a&amp;gt;] ofd_commitrw_write+0xf9a/0x1d00 [ofd]
[10252.159310]  [&amp;lt;ffffffffc120f112&amp;gt;] ofd_commitrw+0x4b2/0xa10 [ofd]
[10252.159310]  [&amp;lt;ffffffffc0c36c39&amp;gt;] ? lprocfs_counter_add+0xf9/0x160 [obdclass]
[10252.159310]  [&amp;lt;ffffffffc0ef8430&amp;gt;] tgt_brw_write+0x1180/0x1d70 [ptlrpc]
[10252.159310] INFO: rcu_sched detected stalls on CPUs/tasks:
[10252.159310]  [&amp;lt;ffffffffc0e4b940&amp;gt;] ? target_send_reply_msg+0x170/0x170 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0ef994a&amp;gt;] tgt_request_handle+0x92a/0x13b0 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0e9da53&amp;gt;] ptlrpc_server_handle_request+0x253/0xab0 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffff810bdc4b&amp;gt;] ? __wake_up_common+0x5b/0x90
[10252.159310]  [&amp;lt;ffffffffc0ea1202&amp;gt;] ptlrpc_main+0xa92/0x1f40 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0ea0770&amp;gt;] ? ptlrpc_register_service+0xe90/0xe90 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffff810b4031&amp;gt;] kthread+0xd1/0xe0
[10252.159310]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[10252.159310]  [&amp;lt;ffffffff816c0577&amp;gt;] ret_from_fork+0x77/0xb0
[10252.159310]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[10252.159310] Code: b8 01 01 01 01 01 01 01 01 48 0f af c1 41 89 f9 41 83 e1 07 75 70 48 89 d1 48 c1 e9 06 74 39 66 0f 1f 84 00 00 00 00 00 48 ff c9 &amp;lt;48&amp;gt; 89 07 48 89 47 08 48 89 47 10 48 89 47 18 48 89 47 20 48 89 
[10252.159310] Kernel panic - not syncing: softlockup: hung tasks
[10274.555013]  { 1[10252.159310] CPU: 1 PID: 23498 Comm: ll_ost_io00_003 Tainted: P           OEL ------------   3.10.0-693.21.1.el7_lustre.x86_64 #1
[10252.159310] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2007
[10252.159310] Call Trace:
[10252.159310]  &amp;lt;IRQ&amp;gt;  [&amp;lt;ffffffff816ae7c8&amp;gt;] dump_stack+0x19/0x1b
[10252.159310]  [&amp;lt;ffffffff816a8634&amp;gt;] panic+0xe8/0x21f
[10252.159310]  [&amp;lt;ffffffff8102d7cf&amp;gt;] ? show_regs+0x5f/0x210
[10252.159310]  [&amp;lt;ffffffff811334e1&amp;gt;] watchdog_timer_fn+0x231/0x240
[10252.159310]  [&amp;lt;ffffffff811332b0&amp;gt;] ? watchdog+0x40/0x40
[10252.159310]  [&amp;lt;ffffffff810b8196&amp;gt;] __hrtimer_run_queues+0xd6/0x260
[10252.159310]  [&amp;lt;ffffffff810b872f&amp;gt;] hrtimer_interrupt+0xaf/0x1d0
[10252.159310]  [&amp;lt;ffffffff8105467b&amp;gt;] local_apic_timer_interrupt+0x3b/0x60
[10252.159310]  [&amp;lt;ffffffff816c4e73&amp;gt;] smp_apic_timer_interrupt+0x43/0x60
[10252.159310]  [&amp;lt;ffffffff816c1732&amp;gt;] apic_timer_interrupt+0x162/0x170
[10252.159310]  &amp;lt;EOI&amp;gt;  [&amp;lt;ffffffff81337f93&amp;gt;] ? memset+0x33/0xb0
[10252.159310]  [&amp;lt;ffffffffc04b2cc7&amp;gt;] ? dbuf_read+0x397/0x9e0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc0575128&amp;gt;] ? zio_done+0x748/0xd20 [zfs]
[10252.159310]  [&amp;lt;ffffffffc056eb8c&amp;gt;] ? zio_destroy+0x7c/0x80 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04b66d9&amp;gt;] dmu_buf_will_dirty+0x119/0x130 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04bcf15&amp;gt;] dmu_write_impl+0x45/0xd0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04beb57&amp;gt;] dmu_write.part.7+0xa7/0x110 [zfs]
[10252.159310]  [&amp;lt;ffffffffc04bed36&amp;gt;] dmu_assign_arcbuf+0x156/0x1a0 [zfs]
[10252.159310]  [&amp;lt;ffffffffc10cfdcd&amp;gt;] osd_write_commit+0x46d/0xa00 [osd_zfs]
[10252.159310]  [&amp;lt;ffffffffc120b29a&amp;gt;] ofd_commitrw_write+0xf9a/0x1d00 [ofd]
[10252.159310]  [&amp;lt;ffffffffc120f112&amp;gt;] ofd_commitrw+0x4b2/0xa10 [ofd]
[10252.159310]  [&amp;lt;ffffffffc0c36c39&amp;gt;] ? lprocfs_counter_add+0xf9/0x160 [obdclass]
[10252.159310]  [&amp;lt;ffffffffc0ef8430&amp;gt;] tgt_brw_write+0x1180/0x1d70 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0e4b940&amp;gt;] ? target_send_reply_msg+0x170/0x170 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0ef994a&amp;gt;] tgt_request_handle+0x92a/0x13b0 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0e9da53&amp;gt;] ptlrpc_server_handle_request+0x253/0xab0 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffff810bdc4b&amp;gt;] ? __wake_up_common+0x5b/0x90
[10252.159310]  [&amp;lt;ffffffffc0ea1202&amp;gt;] ptlrpc_main+0xa92/0x1f40 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffffc0ea0770&amp;gt;] ? ptlrpc_register_service+0xe90/0xe90 [ptlrpc]
[10252.159310]  [&amp;lt;ffffffff810b4031&amp;gt;] kthread+0xd1/0xe0
[10252.159310]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[10252.159310]  [&amp;lt;ffffffff816c0577&amp;gt;] ret_from_fork+0x77/0xb0
[10252.159310]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40

[10274.555013] } (detected by 0, t=60299 jiffies, g=942723, c=942722, q=34)
[10274.555013] Task dump for CPU 1:
[10274.555013] ll_ost_io00_003 R  running task        0 23498      2 0x00000088
[10274.555013] Call Trace:
[10274.555013]  [&amp;lt;ffffffffc04bed36&amp;gt;] ? dmu_assign_arcbuf+0x156/0x1a0 [zfs]
[10274.555013]  [&amp;lt;ffffffffc10cfdcd&amp;gt;] ? osd_write_commit+0x46d/0xa00 [osd_zfs]
[10274.555013]  [&amp;lt;ffffffffc120b29a&amp;gt;] ? ofd_commitrw_write+0xf9a/0x1d00 [ofd]
[10274.555013]  [&amp;lt;ffffffffc120f112&amp;gt;] ? ofd_commitrw+0x4b2/0xa10 [ofd]
[10274.555013]  [&amp;lt;ffffffffc0c36c39&amp;gt;] ? lprocfs_counter_add+0xf9/0x160 [obdclass]
[10274.555013]  [&amp;lt;ffffffffc0ef8430&amp;gt;] ? tgt_brw_write+0x1180/0x1d70 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffffc0e4b940&amp;gt;] ? target_send_reply_msg+0x170/0x170 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffffc0ef994a&amp;gt;] ? tgt_request_handle+0x92a/0x13b0 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffffc0e9da53&amp;gt;] ? ptlrpc_server_handle_request+0x253/0xab0 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffff810bdc4b&amp;gt;] ? __wake_up_common+0x5b/0x90
[10274.555013]  [&amp;lt;ffffffffc0ea1202&amp;gt;] ? ptlrpc_main+0xa92/0x1f40 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffffc0ea0770&amp;gt;] ? ptlrpc_register_service+0xe90/0xe90 [ptlrpc]
[10274.555013]  [&amp;lt;ffffffff810b4031&amp;gt;] ? kthread+0xd1/0xe0
[10274.555013]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[10274.555013]  [&amp;lt;ffffffff816c0577&amp;gt;] ? ret_from_fork+0x77/0xb0
[10274.555013]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="226770" author="laisiyao" created="Thu, 26 Apr 2018 04:01:17 +0000"  >&lt;p&gt;I found something strange in the dump:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;crash&amp;gt; struct lu_dirpage 0xffff8800a6631000
struct lu_dirpage {
  ldp_hash_start = 16131858539135107072,
  ldp_hash_end = 8850982375266543352,
  ldp_flags = 0,
  ldp_pad0 = 0,
  ldp_entries = 0xffff8800a6631018
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This shows that in one of the dir page reads, its start hash is bigger than its end hash, which causes the LASSERT in the code. I&apos;ve added some debug code and am trying to reproduce it.&lt;/p&gt;</comment>
                            <comment id="226871" author="gerrit" created="Fri, 27 Apr 2018 16:27:21 +0000"  >&lt;p&gt;Lai Siyao (lai.siyao@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/32180&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32180&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: dir page is released while in use&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: dc6e38453c0fd50ce1b094d3aa348c0ab7efcdde&lt;/p&gt;</comment>
                            <comment id="227754" author="gerrit" created="Sat, 12 May 2018 03:52:35 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/32180/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32180/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: dir page is released while in use&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: b51e8d6b53a3f3257fd9106ec5ec5eec302baa7f&lt;/p&gt;</comment>
                            <comment id="227769" author="pjones" created="Sat, 12 May 2018 05:44:31 +0000"  >&lt;p&gt;Landed for 2.12&lt;/p&gt;</comment>
                            <comment id="272020" author="gerrit" created="Thu, 4 Jun 2020 21:40:05 +0000"  >&lt;p&gt;Olaf Faaland-LLNL (faaland1@llnl.gov) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38838&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38838&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: stripe dir page may be released mistakenly&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_10&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: fddce17bbad4fe379bedf479edb60034a69af977&lt;/p&gt;</comment>
                            <comment id="272021" author="gerrit" created="Thu, 4 Jun 2020 21:40:06 +0000"  >&lt;p&gt;Olaf Faaland-LLNL (faaland1@llnl.gov) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38839&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38839&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9857&quot; title=&quot;sanityn test_35: (lmv_obd.c:2122:stripe_dirent_next()) ASSERTION( hash &amp;lt;= end )&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9857&quot;&gt;&lt;del&gt;LU-9857&lt;/del&gt;&lt;/a&gt; lmv: dir page is released while in use&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_10&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: a489fb1afa69e5a695e26219ce0fb1d12b73a4f5&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="48004">LU-9923</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzi9j:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>