<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:48:07 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-5052] threads stuck in jbd2_journal_start</title>
                <link>https://jira.whamcloud.com/browse/LU-5052</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;MDS builds up high load with no CPU activity. Lustre is dumping call traces to the console. (Looks like a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4794&quot; title=&quot;MDS threads all stuck in jbd2_journal_start&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4794&quot;&gt;&lt;del&gt;LU-4794&lt;/del&gt;&lt;/a&gt;. If so, please advise when the patch will land.) &lt;/p&gt;

&lt;p&gt;Attached is full stack trace for all threads.&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;INFO: task ldlm_cn_00:6299 blocked &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; more than 120 seconds.
&lt;span class=&quot;code-quote&quot;&gt;&quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot;&lt;/span&gt; disables &lt;span class=&quot;code-keyword&quot;&gt;this&lt;/span&gt; message.
ldlm_cn_00    D 000000000000001a     0  6299      2 0x00000080
 ffff881ec525db30 0000000000000046 0000000000000000 ffffffff8129507e
 ffff881ec525dad0 00000000dcd2dc2e ffff881fb0bd8d00 ffff881ec525dad0
 ffff881fafe73098 ffff881ec525dfd8 000000000000fc40 ffff881fafe73098
Call Trace:
 [&amp;lt;ffffffff8129507e&amp;gt;] ? number+0x2ee/0x320
 [&amp;lt;ffffffffa055c14a&amp;gt;] start_this_handle+0x27a/0x4a0 [jbd2]
 [&amp;lt;ffffffff8108ff00&amp;gt;] ? autoremove_wake_function+0x0/0x40
 [&amp;lt;ffffffffa055c570&amp;gt;] jbd2_journal_start+0xd0/0x110 [jbd2]
 [&amp;lt;ffffffffa08e6338&amp;gt;] ldiskfs_journal_start_sb+0x58/0x90 [ldiskfs]
 [&amp;lt;ffffffffa072c017&amp;gt;] fsfilt_ldiskfs_start+0x77/0x5e0 [fsfilt_ldiskfs]
 [&amp;lt;ffffffffa07a9ac0&amp;gt;] llog_origin_handle_cancel+0x4b0/0xd70 [ptlrpc]
 [&amp;lt;ffffffffa076f71f&amp;gt;] ldlm_cancel_handler+0x1bf/0x5e0 [ptlrpc]
 [&amp;lt;ffffffffa079fb4e&amp;gt;] ptlrpc_main+0xc4e/0x1a40 [ptlrpc]
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
INFO: task ldlm_cb_00:6302 blocked &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; more than 120 seconds.
&lt;span class=&quot;code-quote&quot;&gt;&quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot;&lt;/span&gt; disables &lt;span class=&quot;code-keyword&quot;&gt;this&lt;/span&gt; message.
ldlm_cb_00    D 0000000000000002     0  6302      2 0x00000080
 ffff881ec5265b20 0000000000000046 0000000000000000 000000ab00000000
 ffff881ec5265b50 ffffffff8129507e 3634333236363330 3134363536363336
 ffff881ec5263af8 ffff881ec5265fd8 000000000000fc40 ffff881ec5263af8
Call Trace:
 [&amp;lt;ffffffff8129507e&amp;gt;] ? number+0x2ee/0x320
 [&amp;lt;ffffffff8151ecc5&amp;gt;] rwsem_down_failed_common+0x95/0x1d0
 [&amp;lt;ffffffff8151ee23&amp;gt;] rwsem_down_write_failed+0x23/0x30
 [&amp;lt;ffffffff812992f3&amp;gt;] call_rwsem_down_write_failed+0x13/0x20
 [&amp;lt;ffffffff8151e322&amp;gt;] ? down_write+0x32/0x40
 [&amp;lt;ffffffffa09d543e&amp;gt;] dqacq_handler+0x35e/0xd20 [lquota]
 [&amp;lt;ffffffffa07b8486&amp;gt;] ? __req_capsule_get+0x176/0x750 [ptlrpc]
 [&amp;lt;ffffffffa07921e0&amp;gt;] ? lustre_swab_qdata+0x0/0x30 [ptlrpc]
 [&amp;lt;ffffffffa075e1d8&amp;gt;] target_handle_dqacq_callback+0x668/0xb90 [ptlrpc]
 [&amp;lt;ffffffffa09d50e0&amp;gt;] ? dqacq_handler+0x0/0xd20 [lquota]
 [&amp;lt;ffffffffa076df87&amp;gt;] ldlm_callback_handler+0xa17/0x1ff0 [ptlrpc]
 [&amp;lt;ffffffffa0503ea1&amp;gt;] ? libcfs_debug_msg+0x41/0x50 [libcfs]
 [&amp;lt;ffffffffa04ff4a4&amp;gt;] ? libcfs_id2str+0x74/0xb0 [libcfs]
 [&amp;lt;ffffffffa079fb4e&amp;gt;] ptlrpc_main+0xc4e/0x1a40 [ptlrpc]
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffffa079ef00&amp;gt;] ? ptlrpc_main+0x0/0x1a40 [ptlrpc]
 [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
INFO: task ldlm_cb_01:6303 blocked &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; more than 120 seconds.
&lt;span class=&quot;code-quote&quot;&gt;&quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot;&lt;/span&gt; disables &lt;span class=&quot;code-keyword&quot;&gt;this&lt;/span&gt; message.
ldlm_cb_01    D 000000000000000d     0  6303      2 0x00000080
 ffff881ec5267b20 0000000000000046 0000000000000000 000000ab00000000
 ffff881ec5267b50 ffffffff8129507e ffff881ec5267ad0 000000005c2ae174
 ffff881ec5263098 ffff881ec5267fd8 000000000000fc40 ffff881ec5263098
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>lustre: 2.1.5&lt;br/&gt;
kernel: 2.6.32-279.19.1.el6.20130516.x86_64.lustre215&lt;br/&gt;
build:  2nasS_ofed154&lt;br/&gt;
&lt;br/&gt;
SRC at &lt;a href=&quot;https://github.com/jlan/lustre-nas&quot;&gt;https://github.com/jlan/lustre-nas&lt;/a&gt;&lt;br/&gt;
</environment>
        <key id="24688">LU-5052</key>
            <summary>threads stuck in jbd2_journal_start</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Mon, 12 May 2014 20:34:06 +0000</created>
                <updated>Thu, 30 Apr 2015 23:58:55 +0000</updated>
                            <resolved>Thu, 30 Apr 2015 23:58:55 +0000</resolved>
                                    <version>Lustre 2.4.1</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="83938" author="pjones" created="Mon, 12 May 2014 22:14:50 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Does this appear to be a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4794&quot; title=&quot;MDS threads all stuck in jbd2_journal_start&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4794&quot;&gt;&lt;del&gt;LU-4794&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="83966" author="bfaccini" created="Tue, 13 May 2014 08:38:14 +0000"  >&lt;p&gt;Bobi, &lt;br/&gt;
according to the full stack traces dumped in dmesg, it looks more like a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4271&quot; title=&quot;mds load goes very high and filesystem hangs after mounting mdt&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4271&quot;&gt;&lt;del&gt;LU-4271&lt;/del&gt;&lt;/a&gt;, still not proven as being a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4794&quot; title=&quot;MDS threads all stuck in jbd2_journal_start&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4794&quot;&gt;&lt;del&gt;LU-4794&lt;/del&gt;&lt;/a&gt; itself, what do you think?&lt;/p&gt;</comment>
                            <comment id="83968" author="bobijam" created="Tue, 13 May 2014 10:21:31 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4794&quot; title=&quot;MDS threads all stuck in jbd2_journal_start&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4794&quot;&gt;&lt;del&gt;LU-4794&lt;/del&gt;&lt;/a&gt; relates to an llog handling get/journal transaction deadlock. And in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4794&quot; title=&quot;MDS threads all stuck in jbd2_journal_start&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4794&quot;&gt;&lt;del&gt;LU-4794&lt;/del&gt;&lt;/a&gt; bt-all.merged.txt, there are also similar thread stack traces, just like the 2 threads you posted here.&lt;/p&gt;</comment>
                            <comment id="113941" author="mhanafi" created="Thu, 30 Apr 2015 22:22:39 +0000"  >&lt;p&gt;Please close&lt;/p&gt;</comment>
                            <comment id="113952" author="pjones" created="Thu, 30 Apr 2015 23:58:55 +0000"  >&lt;p&gt;ok - thanks Mahmoud&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="23814">LU-4794</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="14903" name="service200.gz" size="145140" author="mhanafi" created="Mon, 12 May 2014 20:34:06 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwmd3:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>13955</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>