<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:20:04 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>
    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1831] filter_direct_io()) ASSERTION( iobuf-&gt;dr_npages &gt; 0 ) </title>
                <link>https://jira.whamcloud.com/browse/LU-1831</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Lustre: DEBUG MARKER: == sanityn test 15: test out-of-space with multiple writers ========================================== 18:15:33 (1346854533)&lt;br/&gt;
LustreError: 7743:0:(filter_io_26.c:484:filter_direct_io()) ASSERTION( iobuf-&amp;gt;dr_npages &amp;gt; 0 ) failed: &lt;br/&gt;
LustreError: 7743:0:(filter_io_26.c:484:filter_direct_io()) LBUG&lt;br/&gt;
Pid: 7743, comm: ll_ost_io01_002&lt;/p&gt;

&lt;p&gt;Call Trace:&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000dfd5b7a1&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x51/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000dfd5bf7b&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x3b/0xa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000e0e6e437&amp;gt;&amp;#93;&lt;/span&gt; filter_do_bio+0x21c7/0x2a00 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000e0e7001f&amp;gt;&amp;#93;&lt;/span&gt; filter_commitrw_write+0x13af/0x5010 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000dfd5ccd3&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_alloc+0x23/0xf0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000c109ea7a&amp;gt;&amp;#93;&lt;/span&gt; ? cache_alloc_debugcheck_after.isra.40+0xca/0x180&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000dfd5ccd3&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_alloc+0x23/0xf0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000c109ed85&amp;gt;&amp;#93;&lt;/span&gt; ? __kmalloc+0xb5/0x1a0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000c10876a0&amp;gt;&amp;#93;&lt;/span&gt; ? kzfree+0x30/0xc0&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000e0e623fc&amp;gt;&amp;#93;&lt;/span&gt; filter_commitrw+0x29c/0x340 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000c13daa38&amp;gt;&amp;#93;&lt;/span&gt; ? _spin_unlock+0x8/0x10&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000dff2ec4c&amp;gt;&amp;#93;&lt;/span&gt; ? lprocfs_counter_add+0x14c/0x1e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lvfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;00000000e029443f&amp;gt;&amp;#93;&lt;/span&gt; ost_brw_write+0x17fd/0x22e2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;/p&gt;</description>
                <environment>local testing in vbox</environment>
        <key id="15691">LU-1831</key>
            <summary>filter_direct_io()) ASSERTION( iobuf-&gt;dr_npages &gt; 0 ) </summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="hongchao.zhang">Hongchao Zhang</assignee>
                                    <reporter username="bzzz">Alex Zhuravlev</reporter>
                        <labels>
                    </labels>
                <created>Wed, 5 Sep 2012 10:16:28 +0000</created>
                <updated>Mon, 10 Sep 2012 02:54:30 +0000</updated>
                            <resolved>Mon, 10 Sep 2012 02:54:30 +0000</resolved>
                                    <version>Lustre 2.3.0</version>
                    <version>Lustre 2.4.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="44196" author="adilger" created="Wed, 5 Sep 2012 10:59:29 +0000"  >&lt;p&gt;I&apos;m also able to hit this problem 100% of the time on my single-node testing system (real hardware), though I see it at the end of racer.sh when it is trying to unmount the filesystem.&lt;/p&gt;

&lt;p&gt;My first guess would be either some recent change in the RHEL 6.3 kernel bio layer which is breaking the assumption of this code, or a recent modification to nearby code. This code itself has been around for a very long time and I only started seeing the problem with the update to RHEL 6.3, but there was a window of 2 months or so where I didn&apos;t run any tests locally because the ldiskfs patches wouldn&apos;t build against the RHEL 6.2 kernel I had installed. &lt;/p&gt;

&lt;p&gt;I can make the node available for remote debugging if that is needed. However, it isn&apos;t ideal for a bug which crashes the node, since it cannot reboot automatically. &lt;/p&gt;</comment>
                            <comment id="44197" author="bzzz" created="Wed, 5 Sep 2012 11:01:41 +0000"  >&lt;p&gt;I hit this quite often and can help to collect data.&lt;/p&gt;</comment>
                            <comment id="44202" author="jay" created="Wed, 5 Sep 2012 11:33:55 +0000"  >&lt;p&gt;Besides this problem, I also saw that the module refcount of obdfilter was 2 after unmounting all OST targets.&lt;/p&gt;</comment>
                            <comment id="44282" author="pjones" created="Thu, 6 Sep 2012 09:43:27 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="44316" author="adilger" created="Thu, 6 Sep 2012 15:33:26 +0000"  >&lt;p&gt;I checked &lt;tt&gt;git log lustre/obdfilter/filter_io.c&lt;/tt&gt; for changes that had been made recently to that code, and found the following commits:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;commit 859e5b2d20552f8df0ed2afda0f1a7c3c7d86678
Author: Hongchao Zhang &amp;lt;hongchao.zhang@whamcloud.com&amp;gt;
Date:   Mon Aug 20 15:40:48 2012 +0800

    LU-657 obdfilter: fix bug in previous patch
    
    in the merged patch http://review.whamcloud.com/#change,3446,
    the usage of fsfilt_commit_wait is wrong, and it doesn&apos;t stop
    the journal firstly.
    
    Change-Id: I3a36edf7049466880c27c14bb7f99966aa75d4f1
    Reviewed-on: http://review.whamcloud.com/3692

commit a9597791b658ff51474c06f419162d0a0bf03c65
Author: Hongchao Zhang &amp;lt;hongchao.zhang@whamcloud.com&amp;gt;
Date:   Tue Aug 7 08:43:11 2012 +0800

    LU-657 obdfilter: commit pending journals if -ENOSPC
    
    in filter_preprw_write, if there is no enough space for this
    write operation, then commit the pending journals to get some
    more disk space and retry it.
    
    Change-Id: I46106b26443bb203eee6f01a0795b47be09170a6
    Reviewed-on: http://review.whamcloud.com/3446
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Reverting these two patches has allowed me to pass both racer.sh and sanityn.sh test_15 (OOS), which failed for me this morning.&lt;/p&gt;

&lt;p&gt;I suspect there is some kind of refcount problem in the retry code from this patch, and it is only hit when the new code is active when the filesystem is nearly out of space.&lt;/p&gt;</comment>
                            <comment id="44317" author="pjones" created="Thu, 6 Sep 2012 15:48:33 +0000"  >&lt;p&gt;Hongchao&lt;/p&gt;

&lt;p&gt;Could you please look into this?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="44476" author="adilger" created="Mon, 10 Sep 2012 02:54:30 +0000"  >&lt;p&gt;This looks like a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1824&quot; title=&quot;Test failure on test suite obdfilter-survey, subtest test_2a&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1824&quot;&gt;&lt;del&gt;LU-1824&lt;/del&gt;&lt;/a&gt;, which Yu Jian is already working on, and has a patch in &lt;a href=&quot;http://review.whamcloud.com/3913&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/3913&lt;/a&gt; ready for inspection.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="15676">LU-1824</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvglr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6339</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>