<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:41:02 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-4252] Failure on test suite racer test_1</title>
                <link>https://jira.whamcloud.com/browse/LU-4252</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for sarah &amp;lt;sarah@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;http://maloo.whamcloud.com/test_sets/03808e92-49af-11e3-9f02-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://maloo.whamcloud.com/test_sets/03808e92-49af-11e3-9f02-52540035b04c&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_1 failed with the following error:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;test failed to respond and timed out&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;test log shows:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;== racer test 1: racer on clients: client-16vm1,client-16vm2 DURATION=900 ============================ 04:13:57 (1383999237)
racers pids: 28586 28587
CMD: client-16vm1,client-16vm2 DURATION=900 MDSCOUNT=1 				   /usr/lib64/lustre/tests/racer/racer.sh /mnt/lustre2/racer 
CMD: client-16vm1,client-16vm2 DURATION=900 MDSCOUNT=1 				   /usr/lib64/lustre/tests/racer/racer.sh /mnt/lustre/racer 
client-16vm2: file_create.sh: no process found
client-16vm2: dir_create.sh: no process found
client-16vm2: file_rm.sh: no process found
client-16vm2: file_rename.sh: no process found
client-16vm2: file_link.sh: no process found
client-16vm2: file_symlink.sh: no process found
client-16vm2: file_list.sh: no process found
client-16vm2: file_create.sh: no process found
client-16vm2: file_create.sh: no process found
client-16vm2: dir_create.sh: no process found
client-16vm2: file_rm.sh: no process found
client-16vm2: dir_create.sh: no process found
client-16vm2: file_rename.sh: no process found
client-16vm2: file_rm.sh: no process found
client-16vm2: file_link.sh: no process found
client-16vm2: file_rename.sh: no process found
client-16vm2: file_symlink.sh: no process found
client-16vm2: file_link.sh: no process found
client-16vm2: file_list.sh: no process found
client-16vm2: file_symlink.sh: no process found
client-16vm2: file_concat.sh: no process found
client-16vm2: file_list.sh: no process found
client-16vm2: file_exec.sh: no process found
client-16vm2: file_concat.sh: no process found
client-16vm2: file_exec.sh: no process found
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>lustre-master build # 1753 ldiskfs  &lt;br/&gt;
client is running SLES11 SP3</environment>
        <key id="22014">LU-4252</key>
            <summary>Failure on test suite racer test_1</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Thu, 14 Nov 2013 18:43:41 +0000</created>
                <updated>Fri, 15 Nov 2019 20:51:15 +0000</updated>
                            <resolved>Thu, 20 Mar 2014 12:42:57 +0000</resolved>
                                    <version>Lustre 2.6.0</version>
                    <version>Lustre 2.5.1</version>
                                    <fixVersion>Lustre 2.6.0</fixVersion>
                    <fixVersion>Lustre 2.5.2</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="73251" author="adilger" created="Tue, 10 Dec 2013 23:27:47 +0000"  >&lt;p&gt;John,&lt;br/&gt;
Could you please take a look if this is different than the many other racer bugs we have?  There are quite a few and I don&apos;t know the subtleties of each one. &lt;/p&gt;</comment>
                            <comment id="73253" author="jhammond" created="Tue, 10 Dec 2013 23:49:33 +0000"  >&lt;p&gt;Sorry, I can&apos;t tell from what&apos;s on maloo. It looks like a client rebooted but there are no console files for either client.&lt;/p&gt;</comment>
                            <comment id="74370" author="yujian" created="Mon, 6 Jan 2014 03:24:47 +0000"  >&lt;p&gt;Lustre Build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_5/5/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_5/5/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64(server), SLES11SP3/x86_64(client)&lt;/p&gt;

&lt;p&gt;The same failure occurred:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/2dbe5d7a-7640-11e3-b3c0-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/2dbe5d7a-7640-11e3-b3c0-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="79133" author="green" created="Wed, 12 Mar 2014 15:38:48 +0000"  >&lt;p&gt;Two threads that appear to be deadlocked:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[34058.700432] ldlm_elt &#160; &#160; &#160; &#160;D ffff880062ffe010 &#160; &#160; 0 32149 &#160; &#160; &#160;2 0x00000000
[34058.700432] &#160;ffff880062fff9f8 0000000000000046 ffff880062ffe010 0000000000011800
[34058.700432] &#160;0000000000011800 0000000000011800 0000000000011800 ffff880062ffffd8
[34058.700432] &#160;ffff880062ffffd8 0000000000011800 ffff88006b7103c0 ffff8800772e8140
[34058.700432] Call Trace:
[34058.700432] &#160;[&amp;lt;ffffffff8145fda8&amp;gt;] __mutex_lock_slowpath+0xf8/0x150
[34058.700432] &#160;[&amp;lt;ffffffff8145f83a&amp;gt;] mutex_lock+0x1a/0x40
[34058.700432] &#160;[&amp;lt;ffffffffa062cfc5&amp;gt;] ldiskfs_sync_file+0xc5/0x360 [ldiskfs]
[34058.700432] &#160;[&amp;lt;ffffffffa0e66b9c&amp;gt;] osd_object_sync+0x11c/0x150 [osd_ldiskfs]
[34058.700432] &#160;[&amp;lt;ffffffffa0ee8590&amp;gt;] ofd_sync+0x540/0x930 [ofd]
[34058.700432] &#160;[&amp;lt;ffffffffa0dd802f&amp;gt;] obd_sync+0xdf/0x240 [ost]
[34058.700432] &#160;[&amp;lt;ffffffffa0de72aa&amp;gt;] ost_blocking_ast+0x48a/0xee0 [ost]
[34058.700432] &#160;[&amp;lt;ffffffffa09d910f&amp;gt;] ldlm_cancel_callback+0x5f/0x180 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09d9284&amp;gt;] ldlm_lock_cancel+0x54/0x1e0 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09da1ef&amp;gt;] ldlm_cancel_locks_for_export_cb+0x8f/0x200 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa06b3ba8&amp;gt;] cfs_hash_for_each_relax+0x178/0x340 [libcfs]
[34058.700432] &#160;[&amp;lt;ffffffffa06b5cae&amp;gt;] cfs_hash_for_each_empty+0x10e/0x1f0 [libcfs]
[34058.700432] &#160;[&amp;lt;ffffffffa09d59f6&amp;gt;] ldlm_cancel_locks_for_export+0x26/0x30 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09e6bad&amp;gt;] server_disconnect_export+0x5d/0x1a0 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa0ede6c0&amp;gt;] ofd_obd_disconnect+0x60/0x1f0 [ofd]
[34058.700432] &#160;[&amp;lt;ffffffffa07b2528&amp;gt;] class_fail_export+0x118/0x580 [obdclass]
[34058.700432] &#160;[&amp;lt;ffffffffa09ff52f&amp;gt;] expired_lock_main+0x41f/0x880 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffff81082966&amp;gt;] kthread+0x96/0xa0
[34058.700432] &#160;[&amp;lt;ffffffff81469ee4&amp;gt;] kernel_thread_helper+0x4/0x10
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;vs&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[34058.700432] ldlm_cn00_003 &#160; D ffff8800691ffa88 &#160; &#160; 0 &#160;1252 &#160; &#160; &#160;2 0x00000000
[34058.700432] &#160;ffff8800691ffa50 0000000000000046 ffff8800691fe010 0000000000011800
[34058.700432] &#160;0000000000011800 0000000000011800 0000000000011800 ffff8800691fffd8
[34058.700432] &#160;ffff8800691fffd8 0000000000011800 ffff88006e08a5c0 ffff88007bcae300
[34058.700432] Call Trace:
[34058.700432] &#160;[&amp;lt;ffffffffa0612205&amp;gt;] jbd2_log_wait_commit+0xb5/0x130 [jbd2]
[34058.700432] &#160;[&amp;lt;ffffffffa062d0dd&amp;gt;] ldiskfs_sync_file+0x1dd/0x360 [ldiskfs]
[34058.700432] &#160;[&amp;lt;ffffffffa0e66b9c&amp;gt;] osd_object_sync+0x11c/0x150 [osd_ldiskfs]
[34058.700432] &#160;[&amp;lt;ffffffffa0ee8590&amp;gt;] ofd_sync+0x540/0x930 [ofd]
[34058.700432] &#160;[&amp;lt;ffffffffa0dd802f&amp;gt;] obd_sync+0xdf/0x240 [ost]
[34058.700432] &#160;[&amp;lt;ffffffffa0de72aa&amp;gt;] ost_blocking_ast+0x48a/0xee0 [ost]
[34058.700432] &#160;[&amp;lt;ffffffffa09d910f&amp;gt;] ldlm_cancel_callback+0x5f/0x180 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09d9284&amp;gt;] ldlm_lock_cancel+0x54/0x1e0 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09fcdcb&amp;gt;] ldlm_request_cancel+0x25b/0x420 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa09fd0d5&amp;gt;] ldlm_handle_cancel+0x145/0x250 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa0a02329&amp;gt;] ldlm_cancel_handler+0x1e9/0x510 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa0a32fcb&amp;gt;] ptlrpc_server_handle_request+0x37b/0xcd0 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffffa0a35627&amp;gt;] ptlrpc_main+0x917/0xd70 [ptlrpc]
[34058.700432] &#160;[&amp;lt;ffffffff81082966&amp;gt;] kthread+0x96/0xa0
[34058.700432] &#160;[&amp;lt;ffffffff81469ee4&amp;gt;] kernel_thread_helper+0x4/0x10
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="79140" author="pjones" created="Wed, 12 Mar 2014 15:59:19 +0000"  >&lt;p&gt;Hongchao&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="79233" author="hongchao.zhang" created="Thu, 13 Mar 2014 14:10:43 +0000"  >&lt;p&gt;thread &quot;ll_ost_io00_037&quot; has started journal but can&apos;t get the &quot;i_mutex&quot; lock.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;ll_ost_io00_037 D ffff880048206010     0  1448      2 0x00000000
[34058.700432]  ffff880048207a38 0000000000000046 ffff880048206010 0000000000011800
[34058.700432]  0000000000011800 0000000000011800 0000000000011800 ffff880048207fd8
[34058.700432]  ffff880048207fd8 0000000000011800 ffff880048204080 ffff880068ea6200
[34058.700432] Call Trace:
[34058.700432]  [&amp;lt;ffffffff8145fda8&amp;gt;] __mutex_lock_slowpath+0xf8/0x150
[34058.700432]  [&amp;lt;ffffffff8145f83a&amp;gt;] mutex_lock+0x1a/0x40
[34058.700432]  [&amp;lt;ffffffffa0e83649&amp;gt;] osd_punch+0x479/0x610 [osd_ldiskfs]
[34058.700432]  [&amp;lt;ffffffffa0ef1bd1&amp;gt;] ofd_object_punch+0x741/0x960 [ofd]
[34058.700432]  [&amp;lt;ffffffffa0ee71ed&amp;gt;] ofd_punch+0x5dd/0xb20 [ofd]
[34058.700432]  [&amp;lt;ffffffffa0de493f&amp;gt;] ost_punch+0x3af/0xa30 [ost]
[34058.700432]  [&amp;lt;ffffffffa0de6b1e&amp;gt;] ost_handle+0x1b5e/0x1e60 [ost]
[34058.700432]  [&amp;lt;ffffffffa0a32fcb&amp;gt;] ptlrpc_server_handle_request+0x37b/0xcd0 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa0a35627&amp;gt;] ptlrpc_main+0x917/0xd70 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffff81082966&amp;gt;] kthread+0x96/0xa0
[34058.700432]  [&amp;lt;ffffffff81469ee4&amp;gt;] kernel_thread_helper+0x4/0x10
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;thread ldlm_cn00_003 got the &quot;i_mutex&quot; lock and started to commit the journal, but the above thread is holding a journal handle,&lt;br/&gt;
so the journal can&apos;t be committed. &lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[34058.700432] ldlm_cn00_003   D ffff8800691ffa88     0  1252      2 0x00000000
[34058.700432]  ffff8800691ffa50 0000000000000046 ffff8800691fe010 0000000000011800
[34058.700432]  0000000000011800 0000000000011800 0000000000011800 ffff8800691fffd8
[34058.700432]  ffff8800691fffd8 0000000000011800 ffff88006e08a5c0 ffff88007bcae300
[34058.700432] Call Trace:
[34058.700432]  [&amp;lt;ffffffffa0612205&amp;gt;] jbd2_log_wait_commit+0xb5/0x130 [jbd2]
[34058.700432]  [&amp;lt;ffffffffa062d0dd&amp;gt;] ldiskfs_sync_file+0x1dd/0x360 [ldiskfs]
[34058.700432]  [&amp;lt;ffffffffa0e66b9c&amp;gt;] osd_object_sync+0x11c/0x150 [osd_ldiskfs]
[34058.700432]  [&amp;lt;ffffffffa0ee8590&amp;gt;] ofd_sync+0x540/0x930 [ofd]
[34058.700432]  [&amp;lt;ffffffffa0dd802f&amp;gt;] obd_sync+0xdf/0x240 [ost]
[34058.700432]  [&amp;lt;ffffffffa0de72aa&amp;gt;] ost_blocking_ast+0x48a/0xee0 [ost]
[34058.700432]  [&amp;lt;ffffffffa09d910f&amp;gt;] ldlm_cancel_callback+0x5f/0x180 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa09d9284&amp;gt;] ldlm_lock_cancel+0x54/0x1e0 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa09fcdcb&amp;gt;] ldlm_request_cancel+0x25b/0x420 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa09fd0d5&amp;gt;] ldlm_handle_cancel+0x145/0x250 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa0a02329&amp;gt;] ldlm_cancel_handler+0x1e9/0x510 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa0a32fcb&amp;gt;] ptlrpc_server_handle_request+0x37b/0xcd0 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffffa0a35627&amp;gt;] ptlrpc_main+0x917/0xd70 [ptlrpc]
[34058.700432]  [&amp;lt;ffffffff81082966&amp;gt;] kthread+0x96/0xa0
[34058.700432]  [&amp;lt;ffffffff81469ee4&amp;gt;] kernel_thread_helper+0x4/0x10
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;the patch is tracked at &lt;a href=&quot;http://review.whamcloud.com/#/c/9644/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9644/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="79552" author="hongchao.zhang" created="Tue, 18 Mar 2014 03:47:02 +0000"  >&lt;p&gt;After discussing with Yang Sheng and Niu, this issue appears to have been introduced by the patch &lt;a href=&quot;http://review.whamcloud.com/#/c/7794/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/7794/&lt;/a&gt; in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3373&quot; title=&quot;ldiskfs patches for FC19&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3373&quot;&gt;&lt;del&gt;LU-3373&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Reassign to yangsheng to fix it.&lt;/p&gt;</comment>
                            <comment id="79838" author="pjones" created="Thu, 20 Mar 2014 12:42:57 +0000"  >&lt;p&gt;Landed for 2.6&lt;/p&gt;</comment>
                            <comment id="79963" author="ys" created="Fri, 21 Mar 2014 04:16:02 +0000"  >&lt;p&gt;Port to b2_5: &lt;a href=&quot;http://review.whamcloud.com/9742&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/9742&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="29458">LU-6446</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="57402">LU-12977</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw8uf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>11590</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>