<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:28:34 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2829] Timeout on sanityn test_33a: zfs slow when commit_on_sharing enabled</title>
                <link>https://jira.whamcloud.com/browse/LU-2829</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for sarah &amp;lt;sarah@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/2b779918-7787-11e2-987d-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/2b779918-7787-11e2-987d-52540035b04c&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_33a failed with the following error:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;test failed to respond and timed out&lt;/p&gt;&lt;/blockquote&gt;
</description>
                <environment></environment>
        <key id="17614">LU-2829</key>
            <summary>Timeout on sanityn test_33a: zfs slow when commit_on_sharing enabled</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="utopiabound">Nathaniel Clark</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                            <label>performance</label>
                            <label>zfs</label>
                    </labels>
                <created>Mon, 18 Feb 2013 20:08:15 +0000</created>
                <updated>Tue, 31 Dec 2013 15:54:00 +0000</updated>
                            <resolved>Mon, 2 Dec 2013 18:38:20 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                    <version>Lustre 2.4.1</version>
                    <version>Lustre 2.5.0</version>
                                    <fixVersion>Lustre 2.6.0</fixVersion>
                    <fixVersion>Lustre 2.4.2</fixVersion>
                    <fixVersion>Lustre 2.5.1</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="52667" author="keith" created="Mon, 18 Feb 2013 22:47:37 +0000"  >&lt;p&gt;Also the test reports&lt;br/&gt;
test_33a 	&lt;br/&gt;
    Error: &apos;test failed to respond and timed out&apos;&lt;br/&gt;
    Failure Rate: 100.00% of last 100 executions &lt;span class=&quot;error&quot;&gt;&amp;#91;all branches&amp;#93;&lt;/span&gt; &lt;/p&gt;

&lt;p&gt;The systems look like they just waited around for an hour.  &lt;/p&gt;

&lt;p&gt;The test log has a good bit of &quot;/proc/fs/jbd2/mdt1:*/info: No such file or directory&quot; in it.  I am guessing the test got lost.  I don&apos;t expect zfs to have jbd2 business. &lt;/p&gt;</comment>
                            <comment id="53020" author="utopiabound" created="Tue, 26 Feb 2013 03:54:03 +0000"  >&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/5530&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/5530&lt;/a&gt; - ABANDONED&lt;/p&gt;</comment>
                            <comment id="53168" author="utopiabound" created="Thu, 28 Feb 2013 03:58:34 +0000"  >&lt;p&gt;Fix for 33a and 33b need to fix assumptions about device names for these tests to be useful even on autotests since they use dm devices.&lt;/p&gt;</comment>
                            <comment id="53169" author="utopiabound" created="Thu, 28 Feb 2013 04:11:45 +0000"  >&lt;p&gt;This particular failure is not actually related to zfs proc entries.&lt;/p&gt;

&lt;p&gt;One of the createmany processes (run on client1) seems to go out to lunch&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt; 17:43:26 client-19vm1 xinetd[5727]: START: mshell pid=4698 from=::ffff:10.10.4.220
Feb 14 17:43:26 client-19vm1 mrshd[4699]: root@client-19vm1.lab.whamcloud.com as root: cmd=&apos;(PATH=$PATH:/usr/lib64/lustre/utils:/usr/lib64/lustre/tests:/sbin:/usr/sbin; cd /usr/lib64/lustre/tests; LUSTRE=&quot;/usr/lib64/lustre&quot;  MGSFSTYPE=zfs MDSFSTYPE=zfs OSTFSTYPE=zfs FSTYPE=zfs sh -c &quot;createmany -o /mnt/lustre/d0.sanityn/d33-\$(hostname)-1/f- -r /mnt/lustre2/d0.sanityn/d33-\$(hostname)-1/f- 10000 &amp;gt; /dev/null 2&amp;gt;&amp;amp;1&quot;);echo XXRETCODE:$?&apos;
Feb 14 18:40:17 client-19vm1 xinetd[5727]: START: shell pid=28648 from=::ffff:10.10.4.220
Feb 14 18:40:17 client-19vm1 rshd[28650]: autotest@client-19vm1.lab.whamcloud.com as root: cmd=&apos;/home/autotest/.autotest/dynamic_bash/70180499028200+1360896014.64875&apos;
Feb 14 18:40:18 client-19vm1 kernel: SysRq : Show State
...
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;OST has one process blocked on:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;18:41:13:txg_sync      D 0000000000000000     0  2707      2 0x00000080
18:41:13: ffff88007c881bc0 0000000000000046 ffff88007cecf680 0000000000000086
18:41:13: ffff88007c881b70 ffff88007cfeda48 0000000000000001 ffff88007cfeda60
18:41:13: ffff8800796a9af8 ffff88007c881fd8 000000000000fb88 ffff8800796a9af8
18:41:13:Call Trace:
18:41:13: [&amp;lt;ffffffff81090b9e&amp;gt;] ? prepare_to_wait_exclusive+0x4e/0x80
18:41:13: [&amp;lt;ffffffffa016b5ac&amp;gt;] cv_wait_common+0x9c/0x1a0 [spl]
18:41:13: [&amp;lt;ffffffffa02d5160&amp;gt;] ? zio_execute+0x0/0xf0 [zfs]
18:41:13: [&amp;lt;ffffffff81090990&amp;gt;] ? autoremove_wake_function+0x0/0x40
18:41:13: [&amp;lt;ffffffffa016b6e3&amp;gt;] __cv_wait+0x13/0x20 [spl]
18:41:13: [&amp;lt;ffffffffa02d533b&amp;gt;] zio_wait+0xeb/0x160 [zfs]
18:41:13: [&amp;lt;ffffffffa026b807&amp;gt;] dsl_pool_sync+0x2a7/0x480 [zfs]
18:41:13: [&amp;lt;ffffffffa027e147&amp;gt;] spa_sync+0x397/0x9a0 [zfs]
18:41:13: [&amp;lt;ffffffffa028fd41&amp;gt;] txg_sync_thread+0x2c1/0x490 [zfs]
18:41:13: [&amp;lt;ffffffff810527f9&amp;gt;] ? set_user_nice+0xc9/0x130
18:41:13: [&amp;lt;ffffffffa028fa80&amp;gt;] ? txg_sync_thread+0x0/0x490 [zfs]
18:41:13: [&amp;lt;ffffffffa0164668&amp;gt;] thread_generic_wrapper+0x68/0x80 [spl]
18:41:13: [&amp;lt;ffffffffa0164600&amp;gt;] ? thread_generic_wrapper+0x0/0x80 [spl]
18:41:14: [&amp;lt;ffffffff81090626&amp;gt;] kthread+0x96/0xa0
18:41:14: [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
18:41:14: [&amp;lt;ffffffff81090590&amp;gt;] ? kthread+0x0/0xa0
18:41:14: [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This txg_sync stack trace looks very similar to the one posted in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2887&quot; title=&quot;sanity-quota test_12a: slow due to ZFS VMs sharing single disk&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2887&quot;&gt;&lt;del&gt;LU-2887&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="53823" author="utopiabound" created="Tue, 12 Mar 2013 20:10:33 +0000"  >&lt;p&gt;This test will complete on ZFS but it takes an inordinate amount of time (usually slightly over 1 hour).&lt;/p&gt;

&lt;p&gt;zfs times:&lt;br/&gt;
commit_on_sharing=0  ~58s&lt;br/&gt;
commit_on_sharing=1  ~1300s&lt;/p&gt;

&lt;p&gt;ldiskfs times:&lt;br/&gt;
commit_on_sharing=0  ~58s&lt;br/&gt;
commit_on_sharing=1  ~240s&lt;/p&gt;</comment>
                            <comment id="53824" author="utopiabound" created="Tue, 12 Mar 2013 20:11:12 +0000"  >&lt;p&gt;Patch to make logging print fewer errors:&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/5693&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/5693&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="53965" author="pjones" created="Wed, 13 Mar 2013 19:33:12 +0000"  >&lt;p&gt;Landed for 2.4&lt;/p&gt;</comment>
                            <comment id="54007" author="utopiabound" created="Thu, 14 Mar 2013 09:18:08 +0000"  >&lt;p&gt;The core issue isn&apos;t resolved.  This could be de-prioritized because the test will EVENTUALLY pass, just not within a reasonable time.&lt;/p&gt;

&lt;p&gt;The speed is probably related to bug &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2887&quot; title=&quot;sanity-quota test_12a: slow due to ZFS VMs sharing single disk&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2887&quot;&gt;&lt;del&gt;LU-2887&lt;/del&gt;&lt;/a&gt; and ilk.&lt;/p&gt;</comment>
                            <comment id="64075" author="yujian" created="Mon, 12 Aug 2013 11:55:07 +0000"  >&lt;p&gt;Lustre build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/29/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/29/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;With FSTYPE=zfs, sanityn test 33a cannot pass within 3600s:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/3fbb7eca-0257-11e3-b384-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/3fbb7eca-0257-11e3-b384-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="65841" author="yujian" created="Thu, 5 Sep 2013 14:39:05 +0000"  >&lt;p&gt;Lustre build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/44/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/44/&lt;/a&gt; (2.4.1 RC1)&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;br/&gt;
FSTYPE=zfs&lt;/p&gt;

&lt;p&gt;sanityn test 33a timed out with 18000s:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/fbf13be0-1556-11e3-8938-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/fbf13be0-1556-11e3-8938-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="70461" author="yujian" created="Fri, 1 Nov 2013 04:51:26 +0000"  >&lt;p&gt;Lustre Build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/46/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/46/&lt;/a&gt;&lt;br/&gt;
FSTYPE=zfs&lt;/p&gt;

&lt;p&gt;sanityn test 33a timed out with 3600s:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/cff9f9da-305b-11e3-b28a-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/cff9f9da-305b-11e3-b28a-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;We&apos;ll see whether the timeout failure can disappear after TEI-790 is resolved.&lt;/p&gt;</comment>
                            <comment id="70583" author="yujian" created="Mon, 4 Nov 2013 02:54:19 +0000"  >&lt;p&gt;Even with OSTCOUNT=2, sanityn test 33a still timed out in 18000s:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/70536e32-444f-11e3-8472-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/70536e32-444f-11e3-8472-52540035b04c&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/fb7ca724-43ed-11e3-8599-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/fb7ca724-43ed-11e3-8599-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="70623" author="utopiabound" created="Mon, 4 Nov 2013 16:19:48 +0000"  >&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/8161&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8161&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="71517" author="yujian" created="Thu, 14 Nov 2013 11:49:34 +0000"  >&lt;p&gt;The above patch is also needed on Lustre b2_4 and b2_5 branches.&lt;/p&gt;</comment>
                            <comment id="71555" author="bogl" created="Thu, 14 Nov 2013 18:56:13 +0000"  >&lt;p&gt;backport to b2_4&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/8273&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8273&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="71622" author="utopiabound" created="Fri, 15 Nov 2013 14:03:35 +0000"  >&lt;p&gt;8161 cherry-picks over to b2_5 just fine&lt;/p&gt;</comment>
                            <comment id="71624" author="utopiabound" created="Fri, 15 Nov 2013 14:12:25 +0000"  >&lt;p&gt;Landed post 2.5.51&lt;/p&gt;</comment>
                            <comment id="72108" author="yujian" created="Fri, 22 Nov 2013 08:13:38 +0000"  >&lt;p&gt;Patch landed on Lustre b2_4 branch.&lt;/p&gt;</comment>
                            <comment id="72287" author="yujian" created="Tue, 26 Nov 2013 07:35:41 +0000"  >&lt;blockquote&gt;&lt;p&gt;backport to b2_4 &lt;a href=&quot;http://review.whamcloud.com/8273&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8273&lt;/a&gt;&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;The failure still occurred:&lt;/p&gt;

&lt;p&gt;Lustre Build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/58/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/58/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;/p&gt;

&lt;p&gt;FSTYPE=zfs&lt;br/&gt;
MDSCOUNT=1&lt;br/&gt;
MDSSIZE=2097152&lt;br/&gt;
OSTCOUNT=2&lt;br/&gt;
OSTSIZE=2097152&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/0f0a6172-5605-11e3-8e94-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/0f0a6172-5605-11e3-8e94-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="72511" author="yujian" created="Fri, 29 Nov 2013 06:46:06 +0000"  >&lt;p&gt;Patches to decrease the number of files again for sanityn test 33a and 33b:&lt;br/&gt;
For master branch: &lt;a href=&quot;http://review.whamcloud.com/8440&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8440&lt;/a&gt;&lt;br/&gt;
For b2_4 branch: &lt;a href=&quot;http://review.whamcloud.com/8439&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8439&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="72593" author="yujian" created="Mon, 2 Dec 2013 14:38:35 +0000"  >&lt;p&gt;The above patches landed on master and b2_4 branches.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="22012">LU-4251</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="17731">LU-2887</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvjd3:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6852</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>