<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:19:08 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1723] osc_page_delete()) ASSERTION(0) failed</title>
                <link>https://jira.whamcloud.com/browse/LU-1723</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;LBUG on production cluster while node was running a user job.&lt;/p&gt;

&lt;p&gt;Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) page@ffff88106917b5c0&lt;span class=&quot;error&quot;&gt;&amp;#91;1 ffff8806726e8f48:1263 ^(null)_ffff88106917b500 4 0 1 (null) (null) 0x1&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) page@ffff88106917b500&lt;span class=&quot;error&quot;&gt;&amp;#91;1 ffff880770b2c4c8:1263 ^ffff88106917b5c0_(null) 4 0 1 (null) (null) 0x0&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) vvp-page@ffff8809d88c6be0(1:0:0) vm@ffffea0034f6ce20 c0000000000001 3:0 0 1263 lru&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) lov-page@ffff8809f22e93a8&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) osc-page@ffff881067d54bc8: 1&amp;lt; 0x845fed 1 0 - - + &amp;gt; 2&amp;lt; 5173248 0 4096 0x0 0x8 | (null) ffff8806d7f24688 ffff88016958f700 ffffffffa07ff&amp;gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) end page@ffff88106917b5c0&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) Trying to teardown failed: -16&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:426:osc_page_delete()) ASSERTION(0) failed&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:426:osc_page_delete()) LBUG&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: Pid: 64082, comm: calculate_propa&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel:&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: Call Trace:&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0446855&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x55/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0446e95&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x75/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0451d86&amp;gt;&amp;#93;&lt;/span&gt; libcfs_assertion_failed+0x66/0x70 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07f8df6&amp;gt;&amp;#93;&lt;/span&gt; osc_page_delete+0x236/0x240 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0553d1e&amp;gt;&amp;#93;&lt;/span&gt; cl_page_delete0+0xce/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa055128e&amp;gt;&amp;#93;&lt;/span&gt; ? cl_env_get+0x19e/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0550bf6&amp;gt;&amp;#93;&lt;/span&gt; ? cl_env_peek+0x36/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa055408d&amp;gt;&amp;#93;&lt;/span&gt; cl_page_delete+0x3d/0xf0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0560bde&amp;gt;&amp;#93;&lt;/span&gt; ? cl_io_is_going+0xe/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:02 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08e791b&amp;gt;&amp;#93;&lt;/span&gt; ll_releasepage+0x10b/0x150 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81168ff0&amp;gt;&amp;#93;&lt;/span&gt; ? mem_cgroup_uncharge_cache_page+0x10/0x20&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811100b0&amp;gt;&amp;#93;&lt;/span&gt; try_to_release_page+0x30/0x60&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112a4f1&amp;gt;&amp;#93;&lt;/span&gt; shrink_page_list.clone.0+0x4f1/0x5c0&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112a8bb&amp;gt;&amp;#93;&lt;/span&gt; shrink_inactive_list+0x2fb/0x740&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112b5cf&amp;gt;&amp;#93;&lt;/span&gt; shrink_zone+0x38f/0x520&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112c374&amp;gt;&amp;#93;&lt;/span&gt; zone_reclaim+0x354/0x410&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112cfc0&amp;gt;&amp;#93;&lt;/span&gt; ? isolate_pages_global+0x0/0x350&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81122874&amp;gt;&amp;#93;&lt;/span&gt; get_page_from_freelist+0x694/0x820&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81123af1&amp;gt;&amp;#93;&lt;/span&gt; __alloc_pages_nodemask+0x111/0x940&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8116a728&amp;gt;&amp;#93;&lt;/span&gt; ? __mem_cgroup_try_charge+0x78/0x420&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811586ca&amp;gt;&amp;#93;&lt;/span&gt; alloc_pages_vma+0x9a/0x150&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81172015&amp;gt;&amp;#93;&lt;/span&gt; do_huge_pmd_anonymous_page+0x145/0x370&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8113c79a&amp;gt;&amp;#93;&lt;/span&gt; handle_mm_fault+0x25a/0x2b0&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81042c29&amp;gt;&amp;#93;&lt;/span&gt; __do_page_fault+0x139/0x480&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100988e&amp;gt;&amp;#93;&lt;/span&gt; ? __switch_to+0x26e/0x320&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ed250&amp;gt;&amp;#93;&lt;/span&gt; ? thread_return+0x4e/0x76e&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814f2c8e&amp;gt;&amp;#93;&lt;/span&gt; do_page_fault+0x3e/0xa0&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814f0045&amp;gt;&amp;#93;&lt;/span&gt; page_fault+0x25/0x30&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel:&lt;br/&gt;
Aug  8 16:00:03 sand-4-52 kernel: LustreError: dumping log to /tmp/lustre-log.1344438003.64082&lt;/p&gt;</description>
                <environment>Client RHEL-6.2  2.6.32-220.23.1.el6.x86_64</environment>
        <key id="15441">LU-1723</key>
            <summary>osc_page_delete()) ASSERTION(0) failed</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="wjt27">Wojciech Turek</reporter>
                        <labels>
                    </labels>
                <created>Wed, 8 Aug 2012 11:32:09 +0000</created>
                <updated>Mon, 17 Jul 2017 18:48:40 +0000</updated>
                            <resolved>Mon, 29 May 2017 04:57:26 +0000</resolved>
                                    <version>Lustre 2.1.2</version>
                                                        <due></due>
                            <votes>2</votes>
                                    <watches>12</watches>
                                                                            <comments>
                            <comment id="42888" author="jay" created="Wed, 8 Aug 2012 16:08:08 +0000"  >&lt;p&gt;Can you please tell me exactly which version you installed on the client node?&lt;/p&gt;

&lt;p&gt;Also, this patch may help: &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1320&quot; title=&quot;EIO on read shortly after file written&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1320&quot;&gt;&lt;del&gt;LU-1320&lt;/del&gt;&lt;/a&gt; llite: fix a race between readpage and releasepage&quot;.&lt;/p&gt;</comment>
                            <comment id="42893" author="wjt27" created="Wed, 8 Aug 2012 17:09:32 +0000"  >&lt;p&gt;The clients are running lustre-2.1.2&lt;/p&gt;

&lt;p&gt;lustre-client-2.1.2-2.6.32_220.23.1.el6.x86_64.x86_64&lt;br/&gt;
lustre-client-modules-2.1.2-2.6.32_220.23.1.el6.x86_64.x86_64&lt;/p&gt;

&lt;p&gt;Lustre-2.1.2 changelog suggests that it already has a fix for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1320&quot; title=&quot;EIO on read shortly after file written&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1320&quot;&gt;&lt;del&gt;LU-1320&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="43392" author="jay" created="Thu, 16 Aug 2012 23:54:24 +0000"  >&lt;p&gt;Hi Wojciech Turek,&lt;/p&gt;

&lt;p&gt;Can you please post the osc_page_print() function from your source code here? Also, which patches have been applied? Thanks in advance.&lt;/p&gt;</comment>
                            <comment id="43421" author="wjt27" created="Fri, 17 Aug 2012 12:58:09 +0000"  >&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&lt;span class=&quot;code-keyword&quot;&gt;static&lt;/span&gt; &lt;span class=&quot;code-object&quot;&gt;int&lt;/span&gt; osc_page_print(&lt;span class=&quot;code-keyword&quot;&gt;const&lt;/span&gt; struct lu_env *env,
                          &lt;span class=&quot;code-keyword&quot;&gt;const&lt;/span&gt; struct cl_page_slice *slice,
                          void *cookie, lu_printer_t printer)
{
        struct osc_page       *opg = cl2osc_page(slice);
        struct osc_async_page *oap = &amp;amp;opg-&amp;gt;ops_oap;
        struct osc_object     *obj = cl2osc(slice-&amp;gt;cpl_obj);
        struct client_obd     *cli = &amp;amp;osc_export(obj)-&amp;gt;exp_obd-&amp;gt;u.cli;
        struct lov_oinfo      *loi = obj-&amp;gt;oo_oinfo;

        &lt;span class=&quot;code-keyword&quot;&gt;return&lt;/span&gt; (*printer)(env, cookie, LUSTRE_OSC_NAME&lt;span class=&quot;code-quote&quot;&gt;&quot;-page@%p: &quot;&lt;/span&gt;
                          &lt;span class=&quot;code-quote&quot;&gt;&quot;1&amp;lt; %#x %d %u %s %s %s &amp;gt; &quot;&lt;/span&gt;
                          &lt;span class=&quot;code-quote&quot;&gt;&quot;2&amp;lt; &quot;&lt;/span&gt;LPU64&lt;span class=&quot;code-quote&quot;&gt;&quot; %u %u %#x %#x | %p %p %p %p %p &amp;gt; &quot;&lt;/span&gt;
                          &lt;span class=&quot;code-quote&quot;&gt;&quot;3&amp;lt; %s %p %d %lu %d &amp;gt; &quot;&lt;/span&gt;
                          &lt;span class=&quot;code-quote&quot;&gt;&quot;4&amp;lt; %d %d %d %lu %s | %s %s %s %s &amp;gt; &quot;&lt;/span&gt;
                          &lt;span class=&quot;code-quote&quot;&gt;&quot;5&amp;lt; %s %s %s %s | %d %s %s | %d %s %s&amp;gt;\n&quot;&lt;/span&gt;,
                          opg,
                          &lt;span class=&quot;code-comment&quot;&gt;/* 1 */&lt;/span&gt;
                          oap-&amp;gt;oap_magic, oap-&amp;gt;oap_cmd,
                          oap-&amp;gt;oap_interrupted,
                          osc_list(&amp;amp;oap-&amp;gt;oap_pending_item),
                          osc_list(&amp;amp;oap-&amp;gt;oap_urgent_item),
                          osc_list(&amp;amp;oap-&amp;gt;oap_rpc_item),
                          &lt;span class=&quot;code-comment&quot;&gt;/* 2 */&lt;/span&gt;
                          oap-&amp;gt;oap_obj_off, oap-&amp;gt;oap_page_off, oap-&amp;gt;oap_count,
                          oap-&amp;gt;oap_async_flags, oap-&amp;gt;oap_brw_flags,
                          oap-&amp;gt;oap_request,
                          oap-&amp;gt;oap_cli, oap-&amp;gt;oap_loi, oap-&amp;gt;oap_caller_ops,
                          oap-&amp;gt;oap_caller_data,
                          &lt;span class=&quot;code-comment&quot;&gt;/* 3 */&lt;/span&gt;
                          osc_list(&amp;amp;opg-&amp;gt;ops_inflight),
                          opg-&amp;gt;ops_submitter, opg-&amp;gt;ops_transfer_pinned,
                          osc_submit_duration(opg), opg-&amp;gt;ops_srvlock,
                          &lt;span class=&quot;code-comment&quot;&gt;/* 4 */&lt;/span&gt;
                          cli-&amp;gt;cl_r_in_flight, cli-&amp;gt;cl_w_in_flight,
                          cli-&amp;gt;cl_max_rpcs_in_flight,
                          cli-&amp;gt;cl_avail_grant,
                          osc_list(&amp;amp;cli-&amp;gt;cl_cache_waiters),
                          osc_list(&amp;amp;cli-&amp;gt;cl_loi_ready_list),
                          osc_list(&amp;amp;cli-&amp;gt;cl_loi_hp_ready_list),
                          osc_list(&amp;amp;cli-&amp;gt;cl_loi_write_list),
                          osc_list(&amp;amp;cli-&amp;gt;cl_loi_read_list),
                          &lt;span class=&quot;code-comment&quot;&gt;/* 5 */&lt;/span&gt;
                          osc_list(&amp;amp;loi-&amp;gt;loi_ready_item),
                          osc_list(&amp;amp;loi-&amp;gt;loi_hp_ready_item),
                          osc_list(&amp;amp;loi-&amp;gt;loi_write_item),
                          osc_list(&amp;amp;loi-&amp;gt;loi_read_item),
                          loi-&amp;gt;loi_read_lop.lop_num_pending,
                          osc_list(&amp;amp;loi-&amp;gt;loi_read_lop.lop_pending),
                          osc_list(&amp;amp;loi-&amp;gt;loi_read_lop.lop_urgent),
                          loi-&amp;gt;loi_write_lop.lop_num_pending,
                          osc_list(&amp;amp;loi-&amp;gt;loi_write_lop.lop_pending),
                          osc_list(&amp;amp;loi-&amp;gt;loi_write_lop.lop_urgent));
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="43424" author="jay" created="Fri, 17 Aug 2012 13:33:35 +0000"  >&lt;p&gt;Hi Wojciech Turek, Thanks. It looks like the code mismatches the output from your first comment.&lt;/p&gt;

&lt;p&gt;BTW, you can use:&lt;/p&gt;

&lt;p&gt;{code} /* C code */ {code}&lt;/p&gt;

&lt;p&gt;to quote source code on jira.&lt;/p&gt;
</comment>
                            <comment id="43429" author="wjt27" created="Fri, 17 Aug 2012 14:33:37 +0000"  >&lt;p&gt;Hi Jinshan,&lt;/p&gt;

&lt;p&gt;I don&apos;t understand why you say it mismatches, can you elaborate please?&lt;/p&gt;</comment>
                            <comment id="43443" author="jay" created="Fri, 17 Aug 2012 17:06:51 +0000"  >&lt;p&gt;Maybe the output was truncated, from the output you posted:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Aug 8 16:00:02 sand-4-52 kernel: LustreError: 64082:0:(osc_page.c:425:osc_page_delete()) osc-page@ffff881067d54bc8: 1&amp;lt; 0x845fed 1 0 - - + &amp;gt; 2&amp;lt; 5173248 0 4096 0x0 0x8 | (null) ffff8806d7f24688 ffff88016958f700 ffffffffa07ff&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;only paragraph 1 &amp;lt;...&amp;gt; and 2 &amp;lt;...&amp;gt; were printed, but I expect to see all 5 paragraphs.&lt;/p&gt;

&lt;p&gt;How easily can you reproduce this problem? If possible, can you please trigger it and post the output on jira again?&lt;/p&gt;
</comment>
                            <comment id="46509" author="green" created="Sat, 13 Oct 2012 12:28:19 +0000"  >&lt;p&gt;I just hit this running racer on a small local fs (That gets ENOSPC easily):&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[12126.733752] LustreError: 11222:0:(vvp_io.c:1038:vvp_io_commit_write()) Write page 0 of inode ffff88004431db20 failed -28
[12126.734303] LustreError: 11222:0:(vvp_io.c:1038:vvp_io_commit_write()) Skipped 708 previous similar messages
[12198.367486] LustreError: 26187:0:(osc_cache.c:2343:osc_teardown_async_page()) extent ffff88002223ef38@{[256 -&amp;gt; 402/511], [2|0|-|cache|wi|ffff880088af7eb0], [602112|147|+|-|ffff880032770ed8|256|(null)]} trunc at 256.
[12198.368328] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) page@ffff880011a6def0[2 ffff8800169d7f88:256 ^(null)_ffff8800868dfef0 4 0 1 (null) (null) 0x0]
[12198.369065] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) page@ffff8800868dfef0[1 ffff88004b855f98:256 ^ffff880011a6def0_(null) 4 0 1 (null) (null) 0x0]
[12198.369829] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) vvp-page@ffff88009f775af8(0:0:0) vm@ffffea00011fc5f8 20000000000035 2:0 0 256 lru
[12198.370386] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) lov-page@ffff880010cfbae8
[12198.370856] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) osc-page@ffff88008e13ef08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1048576 0 4096 0x0 0x520 | (null) ffff88006f5c8cb0 ffff880088af7eb0 &amp;gt; 3&amp;lt; + ffff880051112540 0 0 0 &amp;gt; 4&amp;lt; 0 0 8 35164160 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 147 - -&amp;gt;
[12198.371911] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) end page@ffff880011a6def0
[12198.372377] LustreError: 26187:0:(osc_page.c:411:osc_page_delete()) Trying to teardown failed: -16
[12198.372850] LustreError: 26187:0:(osc_page.c:412:osc_page_delete()) ASSERTION( 0 ) failed: 
[12198.373329] LustreError: 26187:0:(osc_page.c:412:osc_page_delete()) LBUG
[12198.373602] Pid: 26187, comm: ldlm_bl_21
[12198.373826] 
[12198.373827] Call Trace:
[12198.374850]  [&amp;lt;ffffffffa0caa915&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
[12198.375155]  [&amp;lt;ffffffffa0caaf27&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
[12198.375436]  [&amp;lt;ffffffffa04cec1d&amp;gt;] osc_page_delete+0x29d/0x2a0 [osc]
[12198.375752]  [&amp;lt;ffffffffa11d8e65&amp;gt;] cl_page_delete0+0xd5/0x500 [obdclass]
[12198.376052]  [&amp;lt;ffffffffa11d92d2&amp;gt;] cl_page_delete+0x42/0x120 [obdclass]
[12198.376357]  [&amp;lt;ffffffffa0ac37cd&amp;gt;] ll_invalidatepage+0x8d/0x180 [lustre]
[12198.376692]  [&amp;lt;ffffffffa0ad592f&amp;gt;] vvp_page_discard+0x9f/0x140 [lustre]
[12198.376989]  [&amp;lt;ffffffffa11d6358&amp;gt;] cl_page_invoid+0x78/0x170 [obdclass]
[12198.377307]  [&amp;lt;ffffffffa11d68a8&amp;gt;] ? cl_page_invoke+0x158/0x1c0 [obdclass]
[12198.377607]  [&amp;lt;ffffffffa11d6463&amp;gt;] cl_page_discard+0x13/0x20 [obdclass]
[12198.377903]  [&amp;lt;ffffffffa11e08ae&amp;gt;] check_and_discard_cb+0x13e/0x160 [obdclass]
[12198.378220]  [&amp;lt;ffffffffa11db54c&amp;gt;] cl_page_gang_lookup+0x1fc/0x410 [obdclass]
[12198.378527]  [&amp;lt;ffffffffa11e0770&amp;gt;] ? check_and_discard_cb+0x0/0x160 [obdclass]
[12198.378834]  [&amp;lt;ffffffffa11e0770&amp;gt;] ? check_and_discard_cb+0x0/0x160 [obdclass]
[12198.379144]  [&amp;lt;ffffffffa11de03e&amp;gt;] cl_lock_discard_pages+0x11e/0x1f0 [obdclass]
[12198.379607]  [&amp;lt;ffffffffa11d33d5&amp;gt;] ? cl_env_info+0x15/0x20 [obdclass]
[12198.379888]  [&amp;lt;ffffffffa04cfb80&amp;gt;] osc_lock_flush+0x110/0x200 [osc]
[12198.380167]  [&amp;lt;ffffffffa04cfcc9&amp;gt;] osc_lock_cancel+0x59/0x1a0 [osc]
[12198.380454]  [&amp;lt;ffffffffa11dbda5&amp;gt;] cl_lock_cancel0+0x75/0x160 [obdclass]
[12198.380752]  [&amp;lt;ffffffffa11dca0b&amp;gt;] cl_lock_cancel+0x13b/0x140 [obdclass]
[12198.381045]  [&amp;lt;ffffffffa04d19ba&amp;gt;] osc_ldlm_blocking_ast+0x13a/0x380 [osc]
[12198.381368]  [&amp;lt;ffffffffa12dbaf3&amp;gt;] ldlm_handle_bl_callback+0x123/0x2e0 [ptlrpc]
[12198.381831]  [&amp;lt;ffffffffa12dbf31&amp;gt;] ldlm_bl_thread_main+0x281/0x3e0 [ptlrpc]
[12198.382119]  [&amp;lt;ffffffff81057d60&amp;gt;] ? default_wake_function+0x0/0x20
[12198.382408]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.382692]  [&amp;lt;ffffffff8100c14a&amp;gt;] child_rip+0xa/0x20
[12198.382958]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.383826]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.384126]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
[12198.384378] 
[12198.455840] Kernel panic - not syncing: LBUG
[12198.456115] Pid: 26187, comm: ldlm_bl_21 Not tainted 2.6.32-debug #6
[12198.456423] Call Trace:
[12198.456632]  [&amp;lt;ffffffff814f75e4&amp;gt;] ? panic+0xa0/0x168
[12198.456887]  [&amp;lt;ffffffffa0caaf7b&amp;gt;] ? lbug_with_loc+0x9b/0xb0 [libcfs]
[12198.457201]  [&amp;lt;ffffffffa04cec1d&amp;gt;] ? osc_page_delete+0x29d/0x2a0 [osc]
[12198.457516]  [&amp;lt;ffffffffa11d8e65&amp;gt;] ? cl_page_delete0+0xd5/0x500 [obdclass]
[12198.457816]  [&amp;lt;ffffffffa11d92d2&amp;gt;] ? cl_page_delete+0x42/0x120 [obdclass]
[12198.458127]  [&amp;lt;ffffffffa0ac37cd&amp;gt;] ? ll_invalidatepage+0x8d/0x180 [lustre]
[12198.458420]  [&amp;lt;ffffffffa0ad592f&amp;gt;] ? vvp_page_discard+0x9f/0x140 [lustre]
[12198.458718]  [&amp;lt;ffffffffa11d6358&amp;gt;] ? cl_page_invoid+0x78/0x170 [obdclass]
[12198.459014]  [&amp;lt;ffffffffa11d68a8&amp;gt;] ? cl_page_invoke+0x158/0x1c0 [obdclass]
[12198.459328]  [&amp;lt;ffffffffa11d6463&amp;gt;] ? cl_page_discard+0x13/0x20 [obdclass]
[12198.459627]  [&amp;lt;ffffffffa11e08ae&amp;gt;] ? check_and_discard_cb+0x13e/0x160 [obdclass]
[12198.460126]  [&amp;lt;ffffffffa11db54c&amp;gt;] ? cl_page_gang_lookup+0x1fc/0x410 [obdclass]
[12198.460617]  [&amp;lt;ffffffffa11e0770&amp;gt;] ? check_and_discard_cb+0x0/0x160 [obdclass]
[12198.460970]  [&amp;lt;ffffffffa11e0770&amp;gt;] ? check_and_discard_cb+0x0/0x160 [obdclass]
[12198.462162]  [&amp;lt;ffffffffa11de03e&amp;gt;] ? cl_lock_discard_pages+0x11e/0x1f0 [obdclass]
[12198.462646]  [&amp;lt;ffffffffa11d33d5&amp;gt;] ? cl_env_info+0x15/0x20 [obdclass]
[12198.462932]  [&amp;lt;ffffffffa04cfb80&amp;gt;] ? osc_lock_flush+0x110/0x200 [osc]
[12198.463225]  [&amp;lt;ffffffffa04cfcc9&amp;gt;] ? osc_lock_cancel+0x59/0x1a0 [osc]
[12198.463533]  [&amp;lt;ffffffffa11dbda5&amp;gt;] ? cl_lock_cancel0+0x75/0x160 [obdclass]
[12198.463829]  [&amp;lt;ffffffffa11dca0b&amp;gt;] ? cl_lock_cancel+0x13b/0x140 [obdclass]
[12198.464120]  [&amp;lt;ffffffffa04d19ba&amp;gt;] ? osc_ldlm_blocking_ast+0x13a/0x380 [osc]
[12198.464436]  [&amp;lt;ffffffffa12dbaf3&amp;gt;] ? ldlm_handle_bl_callback+0x123/0x2e0 [ptlrpc]
[12198.464898]  [&amp;lt;ffffffffa12dbf31&amp;gt;] ? ldlm_bl_thread_main+0x281/0x3e0 [ptlrpc]
[12198.465240]  [&amp;lt;ffffffff81057d60&amp;gt;] ? default_wake_function+0x0/0x20
[12198.465533]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.465815]  [&amp;lt;ffffffff8100c14a&amp;gt;] ? child_rip+0xa/0x20
[12198.466084]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.466393]  [&amp;lt;ffffffffa12dbcb0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[12198.466699]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;I have a vmcore for this occurrence&lt;/p&gt;</comment>
                            <comment id="46810" author="jay" created="Sat, 20 Oct 2012 20:13:09 +0000"  >&lt;p&gt;duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="47793" author="bkorb" created="Wed, 14 Nov 2012 12:01:36 +0000"  >&lt;p&gt;I am a little unclear as to how this was diagnosed as a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt;.&lt;br/&gt;
The assertions are different.  This &quot;assert(0)&quot; was initiated because&lt;br/&gt;
osc_page_delete() was called while the opg-&amp;gt;ops_oap field referenced a&lt;br/&gt;
osc_async_page structure with a non-empty oap_rpc_item list.  (That caused&lt;br/&gt;
osc_teardown_async_page to return EBUSY (16) and osc_page_delete handles&lt;br/&gt;
that by asserting that zero is not zero.)&lt;/p&gt;

&lt;p&gt;So, I don&apos;t see the obvious reason the osc_extent_merge assertion would be&lt;br/&gt;
seen as a duplicate of this issue.&lt;/p&gt;</comment>
                            <comment id="47796" author="jay" created="Wed, 14 Nov 2012 13:21:04 +0000"  >&lt;p&gt;In &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt;, I discovered that a write lock can be matched and enqueued by a glimpse process so that the write lock will be marked with INTENT(this write lock was wrongly converted to glimpse lock) in the enqueue RPC, then the lock was denied by OST, then the client calls cl_lock_delete() to delete this lock and grants cl_lock to make it go through with glimpse. After glimpse process finishes to use this lock, it will be deleted w/o canceling.&lt;/p&gt;

&lt;p&gt;Depending on the time when this lock is found by another process, different symptoms will show up. For example, in osc_extent_merge(), I discovered that one of the extent&apos;s oe_lock pointed to that &quot;glimpse write&quot; lock, and another extent had the normal one. For the osc_page_delete() case, that was because one dirty page was added into the &quot;glimpse write&quot; lock; since there is no cancel for this lock, the page still remained in the cache after the lock was deleted. Afterwards, when a read lock was enqueued and canceled, it discovered this page and then hit the assert.&lt;/p&gt;</comment>
                            <comment id="47797" author="bkorb" created="Wed, 14 Nov 2012 13:49:56 +0000"  >&lt;p&gt;OK, well we (Cory at Cray) see the same symptom, even after the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt; patch.&lt;br/&gt;
So there must be another cause for this.&lt;/p&gt;

&lt;p&gt;&amp;gt; Denis Kondratenko added a comment - 06/Nov/12 4:31 AM&lt;br/&gt;
&amp;gt; Wally,&lt;br/&gt;
&amp;gt; was this fixed by &lt;a href=&quot;http://jira.whamcloud.com/browse/LU-2170&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;http://jira.whamcloud.com/browse/LU-2170&lt;/a&gt; ?&lt;br/&gt;
&amp;gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;...&amp;#93;&lt;/span&gt;&lt;br/&gt;
&amp;gt; Wally Wang added a comment - 06/Nov/12 3:19 PM&lt;br/&gt;
&amp;gt; No, attached is the SP2 version of the cdump and it is with the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt; applied.&lt;/p&gt;

&lt;p&gt;The SP2 version of the cdump was, unfortunately, corrupt, so I&apos;ve been futzing&lt;br/&gt;
with the pre-SP2 version.  That earlier dump may well have been caused by the&lt;br/&gt;
issue fixed in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2170&quot; title=&quot;osc_extent_merge()) ASSERTION( cur-&amp;gt;oe_osclock == victim-&amp;gt;oe_osclock) while running racer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2170&quot;&gt;&lt;del&gt;LU-2170&lt;/del&gt;&lt;/a&gt;, but the later dump not.  (Presuming Wally is correct about&lt;br/&gt;
the patch having been applied.)&lt;/p&gt;

&lt;p&gt;I can attach the SP2 console log, if you like.  But not the &quot;lctl dk&quot; dump,&lt;br/&gt;
pending another crash dump.&lt;/p&gt;</comment>
                            <comment id="47804" author="jay" created="Wed, 14 Nov 2012 15:02:46 +0000"  >&lt;p&gt;This is a different issue from what was described by Oleg.&lt;/p&gt;</comment>
                            <comment id="47806" author="bkorb" created="Wed, 14 Nov 2012 15:25:43 +0000"  >&lt;p&gt;OK.  Thank you.  It just looks a lot alike.&lt;br/&gt;
I will keep reading code.&lt;/p&gt;

&lt;p&gt;2012-11-06T14:57:10.872333-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_cache.c:2367:osc_teardown_async_page()) extent ffff88060eedfe58@&lt;/p&gt;
{[23 -&amp;gt; 23/255], [2|0|-|cache|wi|ffff88020e18f8c8], [4096|1|+|-|ffff8801f9ed9c18|256| (null)]}
&lt;p&gt; trunc at 23.&lt;br/&gt;
2012-11-06T14:57:10.872389-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) page@ffff88080e8c8bc0&lt;span class=&quot;error&quot;&gt;&amp;#91;2 ffff88020cefad08:23 ^          (null)_ffff88080e8c8b00 4 0 1  (null)  (null) 0x0&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:10.902445-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) page@ffff88080e8c8b00&lt;span class=&quot;error&quot;&gt;&amp;#91;1 ffff88020d8c1f58:23 ^ffff88080e8c8bc0_          (null) 4 0 1  (null)  (null) 0x0&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:10.902494-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) vvp-page@ffff88080e8cf5a0(0:0:0) vm@ffffea001c6a99b8 e00000000000063 7:0 0 23 lru&lt;br/&gt;
2012-11-06T14:57:10.902508-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) lov-page@ffff8808050a7888&lt;br/&gt;
2012-11-06T14:57:10.958005-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) osc-page@ffff88080d78ed20: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 94208 0 4096 0x0 0x520 |           (null) ffff880804350700 ffff88020e18f8c8 &amp;gt; 3&amp;lt; + ffff8801f8f577b0 0 0 0 &amp;gt; 4&amp;lt; 0 0 8 33824768 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 1 - -&amp;gt;&lt;br/&gt;
2012-11-06T14:57:10.958049-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) end page@ffff88080e8c8bc0&lt;br/&gt;
2012-11-06T14:57:10.983504-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:411:osc_page_delete()) Trying to teardown failed: -16&lt;br/&gt;
2012-11-06T14:57:10.983536-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:412:osc_page_delete()) ASSERTION( 0 ) failed:&lt;br/&gt;
2012-11-06T14:57:10.983549-06:00 c0-0c1s6n0 LustreError: 5270:0:(osc_page.c:412:osc_page_delete()) LBUG&lt;br/&gt;
2012-11-06T14:57:10.983570-06:00 c0-0c1s6n0 Pid: 5270, comm: fsx-linux&lt;br/&gt;
2012-11-06T14:57:10.983582-06:00 c0-0c1s6n0 Call Trace:&lt;br/&gt;
2012-11-06T14:57:10.983605-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810063b1&amp;gt;&amp;#93;&lt;/span&gt; try_stack_unwind+0x161/0x1a0&lt;br/&gt;
2012-11-06T14:57:11.009114-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81004bf9&amp;gt;&amp;#93;&lt;/span&gt; dump_trace+0x89/0x440&lt;br/&gt;
2012-11-06T14:57:11.009138-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa014e887&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x57/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.009161-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa014ede7&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x47/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.009173-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0671d41&amp;gt;&amp;#93;&lt;/span&gt; osc_page_delete+0x2d1/0x2e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.034700-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa02b0095&amp;gt;&amp;#93;&lt;/span&gt; cl_page_delete0+0xd5/0x4e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.034737-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa02b04e2&amp;gt;&amp;#93;&lt;/span&gt; cl_page_delete+0x42/0x120 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.034762-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07f2e2d&amp;gt;&amp;#93;&lt;/span&gt; ll_invalidatepage+0x8d/0x170 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.034774-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa07ea290&amp;gt;&amp;#93;&lt;/span&gt; ll_page_mkwrite+0x7c0/0x840 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-06T14:57:11.034820-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81107cb7&amp;gt;&amp;#93;&lt;/span&gt; __do_fault+0xe7/0x570&lt;br/&gt;
2012-11-06T14:57:11.034833-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811081e4&amp;gt;&amp;#93;&lt;/span&gt; handle_pte_fault+0xa4/0xcd0&lt;br/&gt;
2012-11-06T14:57:11.060561-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81108fbe&amp;gt;&amp;#93;&lt;/span&gt; handle_mm_fault+0x1ae/0x240&lt;br/&gt;
2012-11-06T14:57:11.060588-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81025471&amp;gt;&amp;#93;&lt;/span&gt; do_page_fault+0x191/0x410&lt;br/&gt;
2012-11-06T14:57:11.060600-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81301b5f&amp;gt;&amp;#93;&lt;/span&gt; page_fault+0x1f/0x30&lt;br/&gt;
2012-11-06T14:57:11.060647-06:00 c0-0c1s6n0 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000200422b3&amp;gt;&amp;#93;&lt;/span&gt; 0x200422b3&lt;br/&gt;
2012-11-06T14:57:11.060660-06:00 c0-0c1s6n0 Kernel panic - not syncing: LBUG&lt;/p&gt;</comment>
                            <comment id="47889" author="bkorb" created="Thu, 15 Nov 2012 18:19:31 +0000"  >&lt;p&gt;I don&apos;t see an obvious way to add attachments, so I&apos;ll x-clip and paste some of the log info.&lt;br/&gt;
NOTE: I used a script to edit the time into a format compatible with the console log.&lt;br/&gt;
This &lt;em&gt;is&lt;/em&gt; the &quot;lctl dk&quot; output.&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;2012-11-14T16-33-50.279302:3591:(client.c:1917:ptlrpc_expire_one_request()) @@@ Request  sent has timed out for sent delay: &lt;span class=&quot;error&quot;&gt;&amp;#91;sent 1352932423/real 0&amp;#93;&lt;/span&gt;  req@ffff88041df49c00 x1418650257981646/t0(0) o400-&amp;gt;lustre1-OST0003-osc-ffff88061d741400@53@gni:28/4 lens 224/224 e 0 to 1 dl 1352932430 ref 2 fl Rpc:XN/0/ffffffff rc 0/-1&lt;br/&gt;
2012-11-14T16-33-50.279320:3591:(import.c:167:ptlrpc_set_import_discon()) lustre1-OST0003-osc-ffff88061d741400: Connection to lustre1-OST0003 (at 53@gni) was lost; in progress operations using this service will wait for recovery to complete&lt;br/&gt;
2012-11-14T16-33-50.279328:3591:(import.c:177:ptlrpc_set_import_discon()) ffff880815628000 lustre1-OST0003_UUID: changing import state from FULL to DISCONN&lt;br/&gt;
2012-11-14T16-33-50.279331:3591:(import.c:415:ptlrpc_fail_import()) lustre1-OST0003_UUID: waking up pinger&lt;/p&gt;

&lt;p&gt;2012-11-14T16-34-06.389737:3567:(import.c:1137:ptlrpc_connect_interpret()) ffff880815628000 lustre1-OST0003_UUID: changing import state from CONNECTING to DISCONN&lt;br/&gt;
2012-11-14T16-34-06.389739:3567:(import.c:1183:ptlrpc_connect_interpret()) recovery of lustre1-OST0003_UUID on 53@gni failed (-110 (ETIMEDOUT))&lt;br/&gt;
2012-11-14T16-34-47.095297:3564:(gnilnd_conn.c:2152:kgnilnd_reaper_dgram_check()) GNILND_DGRAM_REQ datagram to 42@gni timed out @ 63s dgram 0xffff880814862288 state GNILND_DGRAM_POSTED conn 0xffff880815013400&lt;/p&gt;

&lt;p&gt;2012-11-14T16-37-35.377578:3567:(import.c:815:ptlrpc_connect_interpret()) lustre1-MDT0000-mdc-ffff88061d741400: connect to target with instance 4&lt;br/&gt;
2012-11-14T16-37-35.377583:3567:(import.c:965:ptlrpc_connect_interpret()) @@@ lustre1-MDT0000-mdc-ffff88061d741400: evicting (reconnect/recover flags not set: 4)  req@ffff88041dd58000 x1418650257981665/t0(0) o38-&amp;gt;lustre1-MDT0000-mdc-ffff88061d741400@52@gni:12/10 lens 400/264 e 0 to 0 dl 1352932681 ref 1 fl Interpret:RN/0/0 rc 0/0&lt;br/&gt;
2012-11-14T16-37-35.377589:3567:(import.c:968:ptlrpc_connect_interpret()) ffff8808153cb000 lustre1-MDT0000_UUID: changing import state from CONNECTING to EVICTED&lt;/p&gt;

&lt;p&gt;2012-11-14T16-37-42.798033:3567:(lcommon_misc.c:77:cl_init_ea_size()) updating max_mdsize/max_cookiesize: 120/128&lt;br/&gt;
2012-11-14T16-37-42.798035:3567:(import.c:965:ptlrpc_connect_interpret()) @@@ lustre1-OST0003-osc-ffff88061d741400: evicting (reconnect/recover flags not set: 4)  req@ffff88081df80c00 x1418650257981674/t0(0) o8-&amp;gt;lustre1-OST0003-osc-ffff88061d741400@53@gni:28/4 lens 400/264 e 0 to 0 dl 1352932683 ref 1 fl Interpret:RN/0/0 rc 0/0&lt;br/&gt;
2012-11-14T16-37-42.798040:3567:(import.c:968:ptlrpc_connect_interpret()) ffff880815628000 lustre1-OST0003_UUID: changing import state from CONNECTING to EVICTED&lt;br/&gt;
2012-11-14T16-37-42.798043:3567:(import.c:1324:ptlrpc_import_recovery_state_machine()) 167-0: This client was evicted by lustre1-OST0003; in progress operations using this service will fail.&lt;br/&gt;
2012-11-14T16-37-42.798044:3567:(import.c:1328:ptlrpc_import_recovery_state_machine()) evicted from lustre1-OST0003_UUID@53@gni; invalidating&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;The connection recovers, according to logs:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;2012-11-14T16-37-42.798209:3867:(import.c:1394:ptlrpc_import_recovery_state_machine()) ffff8808155b6000 lustre1-OST0001_UUID: changing import state from RECOVER to FULL&lt;br/&gt;
2012-11-14T16-37-42.798211:3867:(lov_obd.c:431:lov_set_osc_active()) Marking OSC lustre1-OST0001_UUID active&lt;br/&gt;
2012-11-14T16-37-42.798213:3867:(lcommon_misc.c:77:cl_init_ea_size()) updating max_mdsize/max_cookiesize: 144/128&lt;br/&gt;
2012-11-14T16-37-42.798216:3867:(import.c:1402:ptlrpc_import_recovery_state_machine()) lustre1-OST0001-osc-ffff88061d741400: Connection restored to lustre1-OST0001 (at 53@gni)&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;Then about 400,000 copies of this:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;2012-11-14T16-41-29.357283:3941:(mdc_request.c:836:mdc_close()) @@@ matched open  req@ffff88081542e800 x1418650258369942/t17185315789(17185315789) o101-&amp;gt;lustre1-MDT0000-mdc-ffff88061d741400@52@gni:12/10 lens 560/600 e 0 to 0 dl 1352932906 ref 2 fl Complete:RP/4/0 rc 301/301&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;followed 0.2 seconds later by the LBUG:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;2012-11-14T17-22-00.230715:2496:(osc_cache.c:2367:osc_teardown_async_page()) extent ffff88060ba76480@{[13 -&amp;gt; 13/255], [2|0|-|cache|wi|ffff8802054a9648], [4096|1|+|-|ffff8802172f9318|256|(null)]} trunc at 13.&lt;br/&gt;
2012-11-14T17-22-00.247868:2496:(osc_page.c:411:osc_page_delete()) page@ffff880403fcbcc0&lt;span class=&quot;error&quot;&gt;&amp;#91;2 ffff8802164aa948:13 ^(null)_ffff880403fcb840 4 0 1 (null) (null) 0x1&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-14T17-22-00.260922:2496:(osc_page.c:411:osc_page_delete()) page@ffff880403fcb840&lt;span class=&quot;error&quot;&gt;&amp;#91;1 ffff880207a317d8:13 ^ffff880403fcbcc0_(null) 4 0 1 (null) (null) 0x0&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-11-14T17-22-00.273976:2496:(osc_page.c:411:osc_page_delete()) vvp-page@ffff880401be3320(1:1:0) vm@ffffea000e052f28 6000000000000eb 9:0 0 13 lru&lt;br/&gt;
2012-11-14T17-22-00.285984:2496:(osc_page.c:411:osc_page_delete()) lov-page@ffff8803ea750798&lt;br/&gt;
2012-11-14T17-22-00.293128:2496:(osc_page.c:411:osc_page_delete()) osc-page@ffff880415ce6660: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 53248 0 4096 0x0 0x520 | (null) ffff8808155c65f8 ffff8802054a9648 &amp;gt; 3&amp;lt; + ffff8801f01cb040 0 0 0 &amp;gt; 4&amp;lt; 0 0 8 34373632 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 16 - -&amp;gt;&lt;br/&gt;
2012-11-14T17-22-00.316352:2496:(osc_page.c:411:osc_page_delete()) end page@ffff880403fcbcc0&lt;br/&gt;
2012-11-14T17-22-00.323489:2496:(osc_page.c:411:osc_page_delete()) Trying to teardown failed: -16&lt;br/&gt;
2012-11-14T17-22-00.331062:2496:(osc_page.c:412:osc_page_delete()) ASSERTION( 0 ) failed: &lt;br/&gt;
2012-11-14T17-22-00.338026:2496:(osc_page.c:412:osc_page_delete()) LBUG&lt;br/&gt;
2012-11-14T17-22-00.412653:2496:(linux-debug.c:143:libcfs_run_upcall()) Invoked LNET upcall /usr/lib/lustre/lnet_upcall LBUG,/usr/src/packages/BUILD/cray-lustre-2.3/lustre/osc/osc_page.c,osc_page_delete,412&lt;/p&gt;&lt;/blockquote&gt;</comment>
                            <comment id="48615" author="bkorb" created="Fri, 30 Nov 2012 14:48:14 +0000"  >&lt;p&gt;Here is an xz compressed &quot;dk&quot; log from a crash dump that is an example of the issue.  The two processes 617 and 619 are at issue.  There is a timing hole of some sort.  I will append Shadow&apos;s and my analysis shortly.&lt;/p&gt;</comment>
                            <comment id="48618" author="bkorb" created="Fri, 30 Nov 2012 14:55:04 +0000"  >&lt;p&gt;With a crash dump with debug tracing turned on, we get a lot more useful information.&lt;/p&gt;

&lt;p&gt;Alexey Lyashkov added a comment - 30/Nov/12 12:27 AM&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;In fact that is bug in new osc extent code landed into 2.3 :/
both code path
1) ldlm lock cancel -&amp;gt; page discard ....
and
2) mkwrite /race/ -&amp;gt; invalidate page

forget to find a extent and set correct state for it.  looks osc
extent author forget about forced page flush from a page cache with
mkwrite race and client eviction.

for first case that is more or less clear - cl_lock_discard_pages
forget to find an extent and set truncate state, because use a old API
and directly kill a pages. that is may be fixed via replace
cl_lock_discard_pages [with a] osc_extent_truncate_start or something
similar.

but for second case it&apos;s not clear for me. [It] looks [like] we need
[to] completely change code near of mkwrite and page invalidation.

[Otherwise] (may be dirty hack) - we change osc_page_delete to ignore
error in osc_teardown_async_page for some &apos;force&apos; cases or (better)
correctly abort an IO request for that page if page discard need (page
may be in readahead as was in
790798-osc_page_delete-assert0-sp1-1120-fulldbg.tar.bz2).&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="48893" author="bkorb" created="Fri, 7 Dec 2012 00:10:44 +0000"  >&lt;p&gt;More comments on Xyratex bug.  Given the difficulty/complexity of the change, I would happily accept guidance here.  (i.e. wait for you-all or suggestions on how to proceed)&lt;/p&gt;

&lt;p&gt;Iurii Golovach added a comment - 06/Dec/12 4:34 AM&lt;/p&gt;

&lt;p&gt;During implementation of extents on OSC level, two cases fell between the cracks:&lt;/p&gt;

&lt;ul&gt;
	&lt;li&gt;evict;&lt;/li&gt;
	&lt;li&gt;invalidate page.&lt;br/&gt;
As a result, extent flags for these cases weren&apos;t set and we have a race.&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;Since adding these cases is quite a complex task, we recommend the following:&lt;br/&gt;
1) revert the changes from the following patches:&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,2270&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,2270&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,2009&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,2009&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,2460&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,2460&lt;/a&gt;&lt;br/&gt;
2) wait until Jinshan finishes his work on &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1723&quot; title=&quot;osc_page_delete()) ASSERTION(0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1723&quot;&gt;&lt;del&gt;LU-1723&lt;/del&gt;&lt;/a&gt; and then use changes with correct extents support.&lt;/p&gt;

&lt;p&gt;Please let us know if you need patch against 2.3 to reverse these patches.&lt;/p&gt;

&lt;p&gt;Cory Spitz added a comment - 06/Dec/12 2:42 PM&lt;/p&gt;

&lt;p&gt;Hi, that&apos;s a pretty big change. How many bug fixes would we lose? I&apos;m not sure that the tradeoff for this bug is worth it (yet). Can you guys help w/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1723&quot; title=&quot;osc_page_delete()) ASSERTION(0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1723&quot;&gt;&lt;del&gt;LU-1723&lt;/del&gt;&lt;/a&gt; or are you just waiting for him?&lt;/p&gt;</comment>
                            <comment id="49460" author="bkorb" created="Wed, 19 Dec 2012 12:44:42 +0000"  >&lt;p&gt;In today&apos;s Xyratex/Cray conference call, it was decided to go forward with backing out the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1030&quot; title=&quot;new IO engine&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1030&quot;&gt;&lt;del&gt;LU-1030&lt;/del&gt;&lt;/a&gt; patches from our release branch, pending further work on them.&lt;/p&gt;</comment>
                            <comment id="49465" author="spitzcor" created="Wed, 19 Dec 2012 16:23:36 +0000"  >&lt;p&gt;I think that this should be a 2.4 release blocker.&lt;/p&gt;</comment>
                            <comment id="49624" author="green" created="Sun, 23 Dec 2012 13:31:52 +0000"  >&lt;p&gt;Hm, I think I just hit this issue on my burn-in cluster as well:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[56349.656614] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800805c6f08[3 ffff88000bf11f80:256 ^(null)_ffff880014be0f08 0 0 1 (null) (null) 0x0]
[56349.657354] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880014be0f08[2 ffff88002a8ecf98:256 ^ffff8800805c6f08_(null) 0 0 1 (null) (null) 0x0]
[56349.658145] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65eb60(0:0:0) vm@ffffea00021b5a58 2000000000083c 2:0 ffff8800805c6f08 256 lru
[56349.658890] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff88002510ee00
[56349.659360] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff880062170f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1048576 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.660491] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800805c6f08
[56349.660996] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.661284] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880014be1f08[3 ffff88000bf11f80:257 ^(null)_ffff88001333ef08 0 0 1 (null) (null) 0x0]
[56349.662042] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff88001333ef08[2 ffff88002a8ecf98:257 ^ffff880014be1f08_(null) 0 0 1 (null) (null) 0x0]
[56349.662802] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65ebc8(0:0:0) vm@ffffea0001cef2d0 2000000000083c 2:0 ffff880014be1f08 257 lru
[56349.663548] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff88002510e620
[56349.664016] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff88002b782f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1052672 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.665336] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff880014be1f08
[56349.665805] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.666679] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880093a26f08[3 ffff88000bf11f80:258 ^(null)_ffff88003c596f08 0 0 1 (null) (null) 0x0]
[56349.667419] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff88003c596f08[2 ffff88002a8ecf98:258 ^ffff880093a26f08_(null) 0 0 1 (null) (null) 0x0]
[56349.668166] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65ec30(0:0:0) vm@ffffea0002285560 2000000000083c 2:0 ffff880093a26f08 258 lru
[56349.668917] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff88002510ece0
[56349.669389] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff88005bf32f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1056768 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.671402] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff880093a26f08
[56349.671883] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.672186] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800304a3f08[3 ffff88000bf11f80:259 ^(null)_ffff880032388f08 0 0 1 (null) (null) 0x0]
[56349.672953] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880032388f08[2 ffff88002a8ecf98:259 ^ffff8800304a3f08_(null) 0 0 1 (null) (null) 0x0]
[56349.673667] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65ec98(0:0:0) vm@ffffea0001d40e80 2000000000083c 2:0 ffff8800304a3f08 259 lru
[56349.674403] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff8800740957d0
[56349.674898] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff8800922cff08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1060864 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.676000] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800304a3f08
[56349.676500] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.676872] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800304a2f08[3 ffff88000bf11f80:260 ^(null)_ffff8800639baf08 0 0 1 (null) (null) 0x0]
[56349.677605] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800639baf08[2 ffff88002a8ecf98:260 ^ffff8800304a2f08_(null) 0 0 1 (null) (null) 0x0]
[56349.678374] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65ed00(0:0:0) vm@ffffea0002114048 2000000000083c 2:0 ffff8800304a2f08 260 lru
[56349.679110] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095c98
[56349.679560] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff880081cf0f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1064960 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.680665] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800304a2f08
[56349.681134] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.681428] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800639bbf08[3 ffff88000bf11f80:261 ^(null)_ffff8800223a9f08 0 0 1 (null) (null) 0x0]
[56349.682160] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800223a9f08[2 ffff88002a8ecf98:261 ^ffff8800639bbf08_(null) 0 0 1 (null) (null) 0x0]
[56349.682893] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88006e65ed68(0:0:0) vm@ffffea000218f5a0 2000000000083c 2:0 ffff8800639bbf08 261 lru
[56349.683625] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095ce0
[56349.684092] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff88001309df08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1069056 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.685177] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800639bbf08
[56349.685623] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.685921] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800223a8f08[3 ffff88000bf11f80:262 ^(null)_ffff8800248a3f08 0 0 1 (null) (null) 0x0]
[56349.686682] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800248a3f08[2 ffff88002a8ecf98:262 ^ffff8800223a8f08_(null) 0 0 1 (null) (null) 0x0]
[56349.687427] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88002d0ee0d0(0:0:0) vm@ffffea0001f0b178 2000000000083c 2:0 ffff8800223a8f08 262 lru
[56349.688184] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095ae8
[56349.688665] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff88008e200f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1073152 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.689748] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800223a8f08
[56349.690214] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.690501] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880075c2ef08[3 ffff88000bf11f80:263 ^(null)_ffff880033ee2f08 0 0 1 (null) (null) 0x0]
[56349.691237] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880033ee2f08[2 ffff88002a8ecf98:263 ^ffff880075c2ef08_(null) 0 0 1 (null) (null) 0x0]
[56349.691967] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88002d0ee4e0(0:0:0) vm@ffffea00020fec90 2000000000083c 2:0 ffff880075c2ef08 263 lru
[56349.692706] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095aa0
[56349.693172] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff880093ce0f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1077248 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.694248] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff880075c2ef08
[56349.694717] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.695010] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880033ee3f08[3 ffff88000bf11f80:264 ^(null)_ffff880061765f08 0 0 1 (null) (null) 0x0]
[56349.696293] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff880061765f08[2 ffff88002a8ecf98:264 ^ffff880033ee3f08_(null) 0 0 1 (null) (null) 0x0]
[56349.697945] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88002d0eea90(0:0:0) vm@ffffea0001f481f8 2000000000083c 2:0 ffff880033ee3f08 264 lru
[56349.698697] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095740
[56349.699176] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff8800794ccf08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1081344 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.700246] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff880033ee3f08
[56349.700732] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.701026] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff8800393f6f08[3 ffff88000bf11f80:265 ^(null)_ffff88008b6e9f08 0 0 1 (null) (null) 0x0]
[56349.701758] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) page@ffff88008b6e9f08[2 ffff88002a8ecf98:265 ^ffff8800393f6f08_(null) 0 0 1 (null) (null) 0x0]
[56349.702492] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) vvp-page@ffff88002d0eec30(0:0:0) vm@ffffea000277cc78 2000000000083c 2:0 ffff8800393f6f08 265 lru
[56349.703850] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) lov-page@ffff880074095110
[56349.704321] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) osc-page@ffff88006b098f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1085440 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 1 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.705396] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) end page@ffff8800393f6f08
[56349.706003] LustreError: 20323:0:(osc_io.c:364:trunc_check_cb()) exists 0/cp.
[56349.758028] LustreError: 20323:0:(osc_cache.c:2370:osc_teardown_async_page()) extent ffff88006e1f1f38@{[256 -&amp;gt; 506/511], [2|0|-|cache|wi|ffff880078590eb0], [1028096|251|+|-|ffff88002b60ced8|256|(null)]} trunc at 256.
[56349.759172] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) page@ffff8800805c6f08[2 ffff88000bf11f80:256 ^(null)_ffff880014be0f08 4 0 1 (null) (null) 0x0]
[56349.759981] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) page@ffff880014be0f08[2 ffff88002a8ecf98:256 ^ffff8800805c6f08_(null) 4 0 1 (null) (null) 0x0]
[56349.760931] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) vvp-page@ffff88006e65eb60(0:0:0) vm@ffffea00021b5a58 20000000000035 3:0 0 256 lru
[56349.761537] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) lov-page@ffff88002510ee00
[56349.762131] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) osc-page@ffff880062170f08: 1&amp;lt; 0x845fed 258 0 + - &amp;gt; 2&amp;lt; 1048576 0 4096 0x0 0x520 | (null) ffff88007d410cf0 ffff880078590eb0 &amp;gt; 3&amp;lt; + ffff88006fc50140 0 0 0 &amp;gt; 4&amp;lt; 0 0 8 20480 - | - - + - &amp;gt; 5&amp;lt; - - + - | 0 - | 251 - -&amp;gt;
[56349.763222] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) end page@ffff8800805c6f08
[56349.763780] LustreError: 20323:0:(osc_page.c:431:osc_page_delete()) Trying to teardown failed: -16
[56349.764587] LustreError: 20323:0:(osc_page.c:432:osc_page_delete()) ASSERTION( 0 ) failed: 
[56349.765113] LustreError: 20323:0:(osc_page.c:432:osc_page_delete()) LBUG
[56349.765406] Pid: 20323, comm: cp
[56349.765648] 
[56349.765648] Call Trace:
[56349.766258]  [&amp;lt;ffffffffa0405915&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
[56349.766719]  [&amp;lt;ffffffffa0405f27&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
[56349.767070]  [&amp;lt;ffffffffa09bd5dd&amp;gt;] osc_page_delete+0x32d/0x330 [osc]
[56349.767381]  [&amp;lt;ffffffffa05d6b15&amp;gt;] cl_page_delete0+0xc5/0x510 [obdclass]
[56349.767713]  [&amp;lt;ffffffffa05d6fa2&amp;gt;] cl_page_delete+0x42/0x120 [obdclass]
[56349.768192]  [&amp;lt;ffffffffa0e4025d&amp;gt;] ll_invalidatepage+0x8d/0x180 [lustre]
[56349.768623]  [&amp;lt;ffffffff81129ee8&amp;gt;] do_invalidatepage+0x28/0x30
[56349.768950]  [&amp;lt;ffffffff8112a102&amp;gt;] truncate_inode_page+0xa2/0xc0
[56349.769216]  [&amp;lt;ffffffff8112a42a&amp;gt;] truncate_inode_pages_range+0x15a/0x460
[56349.769515]  [&amp;lt;ffffffff8112a745&amp;gt;] truncate_inode_pages+0x15/0x20
[56349.769877]  [&amp;lt;ffffffff8112a797&amp;gt;] truncate_pagecache+0x47/0x70
[56349.770297]  [&amp;lt;ffffffff8112a7d9&amp;gt;] truncate_setsize+0x19/0x20
[56349.770657]  [&amp;lt;ffffffff8112a81e&amp;gt;] vmtruncate+0x3e/0x70
[56349.771010]  [&amp;lt;ffffffffa0e53a53&amp;gt;] vvp_io_setattr_end+0x63/0x80 [lustre]
[56349.771349]  [&amp;lt;ffffffffa05dec60&amp;gt;] cl_io_end+0x60/0x150 [obdclass]
[56349.771769]  [&amp;lt;ffffffffa05e3d82&amp;gt;] cl_io_loop+0xc2/0x1b0 [obdclass]
[56349.772084]  [&amp;lt;ffffffffa0e4c448&amp;gt;] cl_setattr_ost+0x208/0x2d0 [lustre]
[56349.772389]  [&amp;lt;ffffffffa0e1c122&amp;gt;] ll_setattr_raw+0x792/0xfb0 [lustre]
[56349.772706]  [&amp;lt;ffffffffa0e1c99b&amp;gt;] ll_setattr+0x5b/0xf0 [lustre]
[56349.772987]  [&amp;lt;ffffffff81197688&amp;gt;] notify_change+0x168/0x340
[56349.773252]  [&amp;lt;ffffffff81179af4&amp;gt;] do_truncate+0x64/0xa0
[56349.773530]  [&amp;lt;ffffffff8118c309&amp;gt;] do_filp_open+0x829/0xd90
[56349.773854]  [&amp;lt;ffffffff8118827b&amp;gt;] ? getname+0x3b/0x250
[56349.774277]  [&amp;lt;ffffffff81044f4e&amp;gt;] ? kernel_map_pages+0xfe/0x110
[56349.774708]  [&amp;lt;ffffffff8119861b&amp;gt;] ? alloc_fd+0xab/0x160
[56349.775166]  [&amp;lt;ffffffff81178839&amp;gt;] do_sys_open+0x69/0x140
[56349.775569]  [&amp;lt;ffffffff81178950&amp;gt;] sys_open+0x20/0x30
[56349.775968]  [&amp;lt;ffffffff8100b0f2&amp;gt;] system_call_fastpath+0x16/0x1b
[56349.776371] 
[56349.777741] Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;vmcore and modules are in /exports/crashdumps/192.168.10.218-2012-12-23-08:15:29&lt;/p&gt;</comment>
                            <comment id="49690" author="jay" created="Wed, 26 Dec 2012 18:58:44 +0000"  >&lt;p&gt;Hi Oleg, please file a new bug for this because it seems like a new issue.&lt;/p&gt;

&lt;p&gt;From the stacktrace and crashdump, an extent was not truncated by osc_cache_truncate_start() somehow.&lt;/p&gt;</comment>
                            <comment id="49852" author="bkorb" created="Wed, 2 Jan 2013 16:46:28 +0000"  >&lt;p&gt;Since this was filed against 2.1.2 and the problem we are trying to deal with only occurs on the 2.3 source base, we have opened a new bug report:  &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2557&quot; title=&quot;osc_page_delete()) Trying to teardown failed: -16 (EBUSY)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2557&quot;&gt;&lt;del&gt;LU-2557&lt;/del&gt;&lt;/a&gt;.  It shows exactly the symptom Oleg displayed above, which is the same as my comment from November:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://jira.whamcloud.com/browse/LU-1723?focusedCommentId=47889&amp;amp;page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel#comment-47889&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;http://jira.whamcloud.com/browse/LU-1723?focusedCommentId=47889&amp;amp;page=com.atlassian.jira.plugin.system.issuetabpanels:comment-tabpanel#comment-47889&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="197406" author="adilger" created="Mon, 29 May 2017 04:57:26 +0000"  >&lt;p&gt;Close old ticket.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="12075" name="dk.log.xz" size="4317440" author="bkorb" created="Fri, 30 Nov 2012 14:48:14 +0000"/>
                            <attachment id="11762" name="lustre-log.1344438003.64082.tar.bz2" size="781297" author="wjt27" created="Wed, 8 Aug 2012 11:32:09 +0000"/>
                            <attachment id="11763" name="sand-4-52_lustre_debug.log" size="5044" author="wjt27" created="Wed, 8 Aug 2012 11:32:09 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10490" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>End date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Wed, 2 Jan 2013 11:32:09 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzv46n:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>4210</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10493" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>Start date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Wed, 8 Aug 2012 11:32:09 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    </customfields>
    </item>
</channel>
</rss>