<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:37:57 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3906] Failure on test suite parallel-scale test_compilebench: IOError, No space left on device</title>
                <link>https://jira.whamcloud.com/browse/LU-3906</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/70ec74de-15b9-11e3-8938-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/70ec74de-15b9-11e3-8938-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;client console shows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;11:00:39:Lustre: DEBUG MARKER: == parallel-scale test compilebench: compilebench == 11:00:31 (1378317631)
11:00:39:Lustre: DEBUG MARKER: /usr/sbin/lctl mark free space=1194928, reducing initial dirs to 1
11:00:40:Lustre: DEBUG MARKER: free space=1194928, reducing initial dirs to 1
11:00:40:Lustre: DEBUG MARKER: /usr/sbin/lctl mark .\/compilebench -D \/mnt\/lustre\/d0.compilebench -i 1         -r 2 --makej
11:00:40:Lustre: DEBUG MARKER: ./compilebench -D /mnt/lustre/d0.compilebench -i 1 -r 2 --makej
11:08:26:LustreError: 8551:0:(vvp_io.c:1078:vvp_io_commit_write()) Write page 3250 of inode ffff88001916d1b8 failed -28
11:08:28:LustreError: 8551:0:(vvp_io.c:1078:vvp_io_commit_write()) Write page 3250 of inode ffff88001916d1b8 failed -28
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;OST console shows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;11:00:42:Lustre: DEBUG MARKER: /usr/sbin/lctl mark .\/compilebench -D \/mnt\/lustre\/d0.compilebench -i 1         -r 2 --makej
11:00:43:Lustre: DEBUG MARKER: ./compilebench -D /mnt/lustre/d0.compilebench -i 1 -r 2 --makej
11:05:07:LustreError: 20425:0:(ofd_grant.c:255:ofd_grant_space_left()) lustre-OST0004: cli lustre-OST0004_UUID/ffff880021d8d000 left 44863488 &amp;lt; tot_grant 47737472 unstable 0 pending 0
11:05:07:LustreError: 20425:0:(ofd_grant.c:255:ofd_grant_space_left()) Skipped 6 previous similar messages
11:05:07:LustreError: 21683:0:(ofd_grant.c:255:ofd_grant_space_left()) lustre-OST0004: cli 009dd603-5497-a62c-77c6-19fda0311814/ffff880021d8ec00 left 44863488 &amp;lt; tot_grant 47735680 unstable 0 pending 0
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>server and client: lustre-master build #1652</environment>
        <key id="20857">LU-3906</key>
            <summary>Failure on test suite parallel-scale test_compilebench: IOError, No space left on device</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="yujian">Jian Yu</assignee>
                                    <reporter username="sarah">Sarah Liu</reporter>
                        <labels>
                    </labels>
                <created>Sun, 8 Sep 2013 21:24:06 +0000</created>
                <updated>Tue, 31 Dec 2013 16:31:08 +0000</updated>
                            <resolved>Sat, 23 Nov 2013 14:22:52 +0000</resolved>
                                    <version>Lustre 2.4.1</version>
                    <version>Lustre 2.5.0</version>
                    <version>Lustre 2.6.0</version>
                                    <fixVersion>Lustre 2.6.0</fixVersion>
                    <fixVersion>Lustre 2.4.2</fixVersion>
                    <fixVersion>Lustre 2.5.1</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="70587" author="yujian" created="Mon, 4 Nov 2013 04:56:50 +0000"  >&lt;p&gt;Lustre build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/47/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/47/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;/p&gt;

&lt;p&gt;FSTYPE=zfs&lt;br/&gt;
MDSCOUNT=1&lt;br/&gt;
MDSSIZE=2097152&lt;br/&gt;
OSTCOUNT=2&lt;br/&gt;
OSTSIZE=2097152&lt;/p&gt;

&lt;p&gt;parallel-scale test compilebench failed as follows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;create dir kernel-0 222MB in 459.56 seconds (0.48 MB/s)
Traceback (most recent call last):
  File &quot;./compilebench&quot;, line 576, in &amp;lt;module&amp;gt;
    mbs = run_directory(dset.unpatched, dirname, &quot;create dir&quot;)
  File &quot;./compilebench&quot;, line 245, in run_directory
    fp.close()
IOError: [Errno 28] No space left on device
 parallel-scale test_compilebench: @@@@@@ FAIL: compilebench failed: 1 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Console log on client node:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;10:44:00:Lustre: DEBUG MARKER: ./compilebench -D /mnt/lustre/d0.compilebench -i 2 -r 2 --makej
11:10:17:LustreError: 13106:0:(vvp_io.c:1088:vvp_io_commit_write()) Write page 3 of inode ffff880032124678 failed -28
11:10:18:LustreError: 13106:0:(vvp_io.c:1088:vvp_io_commit_write()) Write page 3 of inode ffff880032124678 failed -28
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Maloo report: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/39210a1a-4453-11e3-8472-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/39210a1a-4453-11e3-8472-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;parallel-scale-nfsv3 and parallel-scale-nfsv4 also failed:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/ce8cbd1a-4453-11e3-8472-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/ce8cbd1a-4453-11e3-8472-52540035b04c&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/fc337542-4453-11e3-8472-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/fc337542-4453-11e3-8472-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Hi Lai,&lt;br/&gt;
Is this similar to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3522&quot; title=&quot;sanity-benchmark test_iozone: &amp;quot;no space left on device&amp;quot; on ZFS&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3522&quot;&gt;&lt;del&gt;LU-3522&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;</comment>
                            <comment id="71265" author="sarah" created="Mon, 11 Nov 2013 20:46:52 +0000"  >&lt;p&gt;seen in 2.5.51 testing: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/2fb17d6c-47ea-11e3-a445-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/2fb17d6c-47ea-11e3-a445-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;IOError: [Errno 28] No space left on device
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="71292" author="yujian" created="Tue, 12 Nov 2013 01:27:19 +0000"  >&lt;p&gt;This is blocking the parallel-scale{,-nfsv3,-nfsv4} testing on ZFS. I&apos;ll check whether the OSTCOUNT=2 and OSTSIZE=2097152 configuration causes the out-of-space failure.&lt;/p&gt;</comment>
                            <comment id="71341" author="adilger" created="Tue, 12 Nov 2013 17:35:14 +0000"  >&lt;p&gt;This is likely a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3522&quot; title=&quot;sanity-benchmark test_iozone: &amp;quot;no space left on device&amp;quot; on ZFS&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3522&quot;&gt;&lt;del&gt;LU-3522&lt;/del&gt;&lt;/a&gt; caused by the OST reserving too much grant for each client block. &lt;/p&gt;

&lt;p&gt;I&apos;m not closing it yet, in case this is actually a problem of the test trying to write more data than will fit into the 4GB of space with 2 OSTs. &lt;/p&gt;</comment>
                            <comment id="71409" author="yujian" created="Wed, 13 Nov 2013 13:00:32 +0000"  >&lt;p&gt;After running compilebench test manually on master branch, I found that the required space for one kernel directory was about 1GB instead of 680MB. For two directories, the test will consume about 2GB space which should not fill up 4GB space. So, this is a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3522&quot; title=&quot;sanity-benchmark test_iozone: &amp;quot;no space left on device&amp;quot; on ZFS&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3522&quot;&gt;&lt;del&gt;LU-3522&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;Here is the patch for the master branch to fix the space estimation code in run_compilebench(): &lt;a href=&quot;http://review.whamcloud.com/8258&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8258&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="71609" author="yujian" created="Fri, 15 Nov 2013 05:28:42 +0000"  >&lt;p&gt;Lustre build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/50/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/50/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;/p&gt;

&lt;p&gt;FSTYPE=zfs&lt;br/&gt;
MDSCOUNT=1&lt;br/&gt;
MDSSIZE=2097152&lt;br/&gt;
OSTCOUNT=2&lt;br/&gt;
OSTSIZE=2097152&lt;br/&gt;
PTLDEBUG=-1&lt;br/&gt;
DEBUG_SIZE=128&lt;/p&gt;

&lt;p&gt;When parallel-scale test compilebench hit the &quot;No space left on device&quot; failure, the space usage of the Lustre filesystem was as follows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;create dir kernel-0 222MB in 344.06 seconds (0.65 MB/s)
Traceback (most recent call last):
  File &quot;./compilebench&quot;, line 576, in &amp;lt;module&amp;gt;
    mbs = run_directory(dset.unpatched, dirname, &quot;create dir&quot;)
  File &quot;./compilebench&quot;, line 245, in run_directory
    fp.close()
IOError: [Errno 28] No space left on device

du -sh /mnt/lustre/*
27M	/mnt/lustre/d0.compilebench

du -sh /mnt/lustre/d0.compilebench/*
19M	/mnt/lustre/d0.compilebench/kernel-0
7.6M	/mnt/lustre/d0.compilebench/kernel-1

lfs df -i
UUID                      Inodes       IUsed       IFree IUse% Mounted on
lustre-MDT0000_UUID      1149005       32051     1116954   3% /mnt/lustre[MDT:0]
lustre-OST0000_UUID        16053       15332         721  96% /mnt/lustre[OST:0]
lustre-OST0001_UUID        16080       15297         783  95% /mnt/lustre[OST:1]

filesystem summary:      1149005       32051     1116954   3% /mnt/lustre


lfs df -h
UUID                       bytes        Used   Available Use% Mounted on
lustre-MDT0000_UUID         2.0G       53.6M        1.9G   3% /mnt/lustre[MDT:0]
lustre-OST0000_UUID         2.0G        1.9G       88.1M  96% /mnt/lustre[OST:0]
lustre-OST0001_UUID         2.0G        1.9G       93.9M  95% /mnt/lustre[OST:1]

filesystem summary:         3.9G        3.7G      182.0M  95% /mnt/lustre


 parallel-scale test_compilebench: @@@@@@ FAIL: compilebench failed: 1 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Maloo report: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/082a9faa-4db5-11e3-8fb6-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/082a9faa-4db5-11e3-8fb6-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="71623" author="yujian" created="Fri, 15 Nov 2013 14:06:03 +0000"  >&lt;p&gt;Here is the patch for the Lustre b2_4 branch to fix the space estimation code in run_compilebench(): &lt;a href=&quot;http://review.whamcloud.com/8288&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8288&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="72106" author="yujian" created="Fri, 22 Nov 2013 08:04:57 +0000"  >&lt;p&gt;Patch landed on Lustre b2_4 branch. The real issue is &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3522&quot; title=&quot;sanity-benchmark test_iozone: &amp;quot;no space left on device&amp;quot; on ZFS&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3522&quot;&gt;&lt;del&gt;LU-3522&lt;/del&gt;&lt;/a&gt;, which still needs to be fixed.&lt;/p&gt;</comment>
                            <comment id="72185" author="pjones" created="Sat, 23 Nov 2013 14:22:52 +0000"  >&lt;p&gt;Landed for 2.6&lt;/p&gt;</comment>
                            <comment id="72465" author="yujian" created="Thu, 28 Nov 2013 07:20:24 +0000"  >&lt;p&gt;In the current run_compilebench(), lfs_df is used to get the free disk space usage information. However, run_compilebench() will also be run on an NFS client, which has no Lustre filesystem, so we need to change lfs_df to df. Here are the patches:&lt;br/&gt;
For master branch: &lt;a href=&quot;http://review.whamcloud.com/8429&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8429&lt;/a&gt;&lt;br/&gt;
For b2_4 branch: &lt;a href=&quot;http://review.whamcloud.com/8430&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8430&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="19589">LU-3522</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="20863">LU-3912</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="20864">LU-3913</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="20860">LU-3909</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="20855">LU-3904</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="20856">LU-3905</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw1cv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10301</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>