<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:37:52 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3896] racer test hung: /mnt/lustre2 is still busy, wait one second</title>
                <link>https://jira.whamcloud.com/browse/LU-3896</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;racer test hung as follows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;== racer test complete, duration 1006 sec == 00:42:55 (1378194175)
CMD: wtm-29vm3 /usr/sbin/lctl get_param -n version
CMD: wtm-29vm3 /usr/sbin/lctl conf_param lustre.quota.mdt=ug
CMD: wtm-29vm3 /usr/sbin/lctl conf_param lustre.quota.ost=ug
Stopping clients: wtm-29vm5,wtm-29vm6.rosso.whamcloud.com /mnt/lustre2 (opts:)
CMD: wtm-29vm5,wtm-29vm6.rosso.whamcloud.com running=\$(grep -c /mnt/lustre2&apos; &apos; /proc/mounts);
if [ \$running -ne 0 ] ; then
echo Stopping client \$(hostname) /mnt/lustre2 opts:;
lsof /mnt/lustre2 || need_kill=no;
if [ x != x -a x\$need_kill != xno ]; then
    pids=\$(lsof -t /mnt/lustre2 | sort -u);
    if [ -n \&quot;\$pids\&quot; ]; then
             kill -9 \$pids;
    fi
fi;
while umount  /mnt/lustre2 2&amp;gt;&amp;amp;1 | grep -q busy; do
    echo /mnt/lustre2 is still busy, wait one second &amp;amp;&amp;amp; sleep 1;
done;
fi
Stopping client wtm-29vm6.rosso.whamcloud.com /mnt/lustre2 opts:
Stopping client wtm-29vm5.rosso.whamcloud.com /mnt/lustre2 opts:
COMMAND   PID USER   FD   TYPE      DEVICE SIZE/OFF               NODE NAME
dd       3713 root    1w   REG 1273,181606  7769088 450359979933698183 /mnt/lustre/racer1/6 (deleted)
dd      10024 root    1w   REG 1273,181606 99767296 450359979950473219 /mnt/lustre2/racer1/2 (deleted)
dd      10031 root    1w   REG 1273,181606  9411584 450359979967250450 /mnt/lustre2/racer1/12
dd      10059 root    1w   REG 1273,181606 85909504 432345581440991292 /mnt/lustre2/racer/6
dd      10062 root    1w   REG 1273,181606 56402944 432345581440991267 /mnt/lustre/racer/8
dd      10074 root    1w   REG 1273,181606 47879168 432345581457768455 /mnt/lustre/racer/9
dd      10076 root    1w   REG 1273,181606 45958144 432345581407436811 /mnt/lustre2/racer/13
dd      10084 root    1w   REG 1273,181606 47879168 432345581457768455 /mnt/lustre/racer/9
dd      10130 root    1w   REG 1273,181606 18804736 468374378443178004 /mnt/lustre/racer2/13
dd      10173 root    1w   REG 1273,181606 55358464 486388776969437193 /mnt/lustre/racer3/6
dd      10421 root    1w   REG 1273,181606  2441216 486388776952660004 /mnt/lustre/racer3/10
dd      10450 root    1w   REG 1273,181606 50086912 468374378476732457 /mnt/lustre/racer2/0
dd      10456 root    1w   REG 1273,181606 31876096 468374378443178023 /mnt/lustre/racer2/13 (deleted)
dd      10457 root    1w   REG 1273,181606 64463872 486388776952660005 /mnt/lustre/racer3/19
dd      10527 root    1w   REG 1273,181606  2441216 486388776952660004 /mnt/lustre2/racer3/10
dd      10581 root    1w   REG 1273,181606  7365632 468374378459955230 /mnt/lustre2/racer2/11
dd      11360 root    1w   REG 1273,181606 57447424 450359979967250475 /mnt/lustre2/racer1/10
cat     11906 root    1w   REG 1273,181606 10503168 486388776935882790 /mnt/lustre2/racer3/2 (deleted)
cat     11906 root    3r   REG 1273,181606 39769088 486388776986214418 /mnt/lustre2/racer3/5
dd      11947 root    1w   REG 1273,181606 10503168 486388776935882790 /mnt/lustre2/racer3/2 (deleted)
cat     12675 root    1w   REG 1273,181606  8477696 450359979933696110 /mnt/lustre/racer1/1 (deleted)
cat     12675 root    3r   REG 1273,181606  8478720 450359979933696048 /mnt/lustre/racer1/5
dd      15141 root    1w   REG 1273,181606 58491904 468374378476732558 /mnt/lustre2/racer2/3 (deleted)
dd      21547 root    1w   REG 1273,181606 32379904 468374378476734932 /mnt/lustre2/racer2/5
dd      29365 root    1w   REG 1273,181606 61625344 450359979916919106 /mnt/lustre/racer1/0
/mnt/lustre2 is still busy, wait one second
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Console log on client wtm-29vm6 showed that:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00:42:04:cat           D 0000000000000000     0  4282   2714 0x00000080
00:42:04: ffff880062aefc90 0000000000000082 0000000000000246 000000100000000d
00:42:04: ffffffff00000050 ffffffffa06b3390 ffff88006c91e1e8 ffff88006c91ca28
00:42:04: ffff880065a2f058 ffff880062aeffd8 000000000000fb88 ffff880065a2f058
00:42:04:Call Trace:
00:42:04: [&amp;lt;ffffffffa06b3390&amp;gt;] ? ldlm_completion_ast+0x0/0x960 [ptlrpc]
00:42:04: [&amp;lt;ffffffffa09a9fa0&amp;gt;] ? lov_io_init_raid0+0x3e0/0x800 [lov]
00:42:04: [&amp;lt;ffffffff81510695&amp;gt;] rwsem_down_failed_common+0x95/0x1d0
00:42:04: [&amp;lt;ffffffff81510826&amp;gt;] rwsem_down_read_failed+0x26/0x30
00:42:04: [&amp;lt;ffffffff81283844&amp;gt;] call_rwsem_down_read_failed+0x14/0x30
00:42:04: [&amp;lt;ffffffff8150fd24&amp;gt;] ? down_read+0x24/0x30
00:42:04: [&amp;lt;ffffffffa0a7182d&amp;gt;] ll_file_io_generic+0x29d/0x600 [lustre]
00:42:04: [&amp;lt;ffffffffa0a71ccf&amp;gt;] ll_file_aio_read+0x13f/0x2c0 [lustre]
00:42:04: [&amp;lt;ffffffffa0a7256c&amp;gt;] ll_file_read+0x16c/0x2a0 [lustre]
00:42:04: [&amp;lt;ffffffff81181a95&amp;gt;] vfs_read+0xb5/0x1a0
00:42:04: [&amp;lt;ffffffff81181bd1&amp;gt;] sys_read+0x51/0x90
00:42:04: [&amp;lt;ffffffff810dc685&amp;gt;] ? __audit_syscall_exit+0x265/0x290
00:42:04: [&amp;lt;ffffffff8100b072&amp;gt;] system_call_fastpath+0x16/0x1b
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Stack trace on client wtm-29vm5 showed that:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;dd            S 0000000000000000     0  3713      1 0x00000080
 ffff880042549bd8 0000000000000086 ffffffffa0581e5c ffff8800679bf5b8
 0000000000000002 ffff880067ac4040 ffff880042549be8 ffffffffa055d35c
 ffff880067ac45f8 ffff880042549fd8 000000000000fb88 ffff880067ac45f8
Call Trace:
 [&amp;lt;ffffffffa055d35c&amp;gt;] ? cl_lock_trace0+0x11c/0x130 [obdclass]
 [&amp;lt;ffffffffa0554825&amp;gt;] ? cl_env_info+0x15/0x20 [obdclass]
 [&amp;lt;ffffffffa03d86fe&amp;gt;] cfs_waitq_wait+0xe/0x10 [libcfs]
 [&amp;lt;ffffffffa056171a&amp;gt;] cl_lock_state_wait+0x1aa/0x320 [obdclass]
 [&amp;lt;ffffffff81063410&amp;gt;] ? default_wake_function+0x0/0x20
 [&amp;lt;ffffffffa0561f0b&amp;gt;] cl_enqueue_locked+0x15b/0x1f0 [obdclass]
 [&amp;lt;ffffffffa0562a8e&amp;gt;] cl_lock_request+0x7e/0x270 [obdclass]
 [&amp;lt;ffffffffa0567d2c&amp;gt;] cl_io_lock+0x3cc/0x560 [obdclass]
 [&amp;lt;ffffffffa0567f62&amp;gt;] cl_io_loop+0xa2/0x1b0 [obdclass]
 [&amp;lt;ffffffffa09df9e0&amp;gt;] ll_file_io_generic+0x450/0x600 [lustre]
 [&amp;lt;ffffffffa09e0922&amp;gt;] ll_file_aio_write+0x142/0x2c0 [lustre]
 [&amp;lt;ffffffffa09e0c0c&amp;gt;] ll_file_write+0x16c/0x2a0 [lustre]
 [&amp;lt;ffffffff81181368&amp;gt;] vfs_write+0xb8/0x1a0
 [&amp;lt;ffffffff81181c61&amp;gt;] sys_write+0x51/0x90
 [&amp;lt;ffffffff810dc685&amp;gt;] ? __audit_syscall_exit+0x265/0x290
 [&amp;lt;ffffffff8100b072&amp;gt;] system_call_fastpath+0x16/0x1b
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Maloo report: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/66e0f40c-1649-11e3-aa2a-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/66e0f40c-1649-11e3-aa2a-52540035b04c&lt;/a&gt;&lt;/p&gt;</description>
                <environment>&lt;br/&gt;
Lustre build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/44/&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/44/&lt;/a&gt; (2.4.1 RC1)&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;br/&gt;
FSTYPE=zfs&lt;br/&gt;
MDSCOUNT=4&lt;br/&gt;
</environment>
        <key id="20824">LU-3896</key>
            <summary>racer test hung: /mnt/lustre2 is still busy, wait one second</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="yujian">Jian Yu</reporter>
                        <labels>
                            <label>dne</label>
                            <label>yuc2</label>
                            <label>zfs</label>
                    </labels>
                <created>Fri, 6 Sep 2013 13:59:00 +0000</created>
                <updated>Sun, 10 Oct 2021 22:36:44 +0000</updated>
                            <resolved>Sun, 10 Oct 2021 22:36:44 +0000</resolved>
                                    <version>Lustre 2.4.1</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="65963" author="green" created="Fri, 6 Sep 2013 16:38:22 +0000"  >&lt;p&gt;This might be more fallout from &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3027&quot; title=&quot;Failure on test suite parallel-scale test_write_disjoint: invalid file size 140329 instead of 160376 = 20047 * 8&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3027&quot;&gt;&lt;del&gt;LU-3027&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="72289" author="yujian" created="Tue, 26 Nov 2013 07:53:51 +0000"  >&lt;p&gt;Lustre Build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/58/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/58/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;/p&gt;

&lt;p&gt;FSTYPE=zfs&lt;br/&gt;
MDSCOUNT=1&lt;br/&gt;
MDSSIZE=2097152&lt;br/&gt;
OSTCOUNT=2&lt;br/&gt;
OSTSIZE=2097152&lt;/p&gt;

&lt;p&gt;racer test hit the same failure again:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/d73fa562-5605-11e3-8e94-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/d73fa562-5605-11e3-8e94-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;The same test passed in manual run:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sessions/2a310d0a-567a-11e3-82a8-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sessions/2a310d0a-567a-11e3-82a8-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="128699" author="standan" created="Tue, 29 Sep 2015 01:19:38 +0000"  >&lt;p&gt;Also observed the same issue in suite_log of replay-dual for interop testing for 2.7.60 tag&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/f5135c3c-62dd-11e5-b25a-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/f5135c3c-62dd-11e5-b25a-5254006e85c2&lt;/a&gt;&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;while umount  /mnt/lustre2 2&amp;gt;&amp;amp;1 | grep -q busy; do
    echo /mnt/lustre2 is still busy, wait one second &amp;amp;&amp;amp; sleep 1;
done;
fi
Stopping client onyx-38vm6.onyx.hpdd.intel.com /mnt/lustre2 opts:
Stopping client onyx-38vm5.onyx.hpdd.intel.com /mnt/lustre2 opts:
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw0nj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10186</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>