<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:34:45 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10402] Service thread hung at jbd2_journal_start</title>
                <link>https://jira.whamcloud.com/browse/LU-10402</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;OSS started to become unresponsive with lots of stack traces.&lt;/p&gt;

&lt;p&gt;First stack trace was&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&amp;lt;4&amp;gt;LNet: Service thread pid 30365 was inactive &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; 962.00s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; debugging purposes:
&amp;lt;4&amp;gt;LNet: Skipped 4 previous similar messages
&amp;lt;4&amp;gt;Pid: 30365, comm: ll_ost_io00_100
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810a3f5e&amp;gt;] ? prepare_to_wait+0x4e/0x80
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0df0fca&amp;gt;] start_this_handle+0x25a/0x480 [jbd2]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810a3c30&amp;gt;] ? autoremove_wake_function+0x0/0x40
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0df13d5&amp;gt;] jbd2_journal_start+0xb5/0x100 [jbd2]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0e49b86&amp;gt;] ldiskfs_journal_start_sb+0x56/0xe0 [ldiskfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0f08ebf&amp;gt;] osd_trans_start+0x1df/0x660 [osd_ldiskfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa10ac4e5&amp;gt;] ofd_write_attr_set+0x2c5/0x8c0 [ofd]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa10ad4c6&amp;gt;] ofd_commitrw_write+0x256/0x11a0 [ofd]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa10b47ad&amp;gt;] ? ofd_fmd_find_nolock+0xad/0xd0 [ofd]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa10ae9c3&amp;gt;] ofd_commitrw+0x5b3/0xba0 [ofd]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa07045a1&amp;gt;] ? lprocfs_counter_add+0x151/0x1c0 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b438d&amp;gt;] obd_commitrw.clone.0+0x11d/0x390 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09bc299&amp;gt;] tgt_brw_write+0xc69/0x1520 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa090dd10&amp;gt;] ? target_bulk_timeout+0x0/0xc0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09baece&amp;gt;] tgt_request_handle+0x8be/0x1020 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0964ca1&amp;gt;] ptlrpc_main+0xf41/0x1a80 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0963d60&amp;gt;] ? ptlrpc_main+0x0/0x1a80 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810a379e&amp;gt;] kthread+0x9e/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c28a&amp;gt;] child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810a3700&amp;gt;] ? kthread+0x0/0xc0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c280&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;I will attach bt for all threads.&lt;/p&gt;

&lt;p&gt;Is this a dup of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6918&quot; title=&quot;Deadlock on transaction with iget()/clear_inode()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6918&quot;&gt;&lt;del&gt;LU-6918&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;</description>
                <environment>Lustre 2.7.3 fe</environment>
        <key id="49772">LU-10402</key>
            <summary>Service thread hung at jbd2_journal_start</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Fri, 15 Dec 2017 20:43:08 +0000</created>
                <updated>Sat, 16 Jun 2018 13:53:06 +0000</updated>
                            <resolved>Sat, 16 Jun 2018 13:53:06 +0000</resolved>
                                    <version>Lustre 2.7.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="216626" author="pjones" created="Mon, 18 Dec 2017 18:10:37 +0000"  >&lt;p&gt;Yang Sheng&lt;/p&gt;

&lt;p&gt;Can you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="216683" author="ys" created="Tue, 19 Dec 2017 02:57:35 +0000"  >&lt;p&gt;From stack trace:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;PID: 22328  TASK: ffff881b2cbed520  CPU: 5   COMMAND: &quot;ll_ost00_003&quot;
 #0 [ffff881b2cbf3630] schedule at ffffffff81581292
 #1 [ffff881b2cbf3708] __wait_on_freeing_inode at ffffffff811b1f78
 #2 [ffff881b2cbf3778] find_inode_fast at ffffffff811b1ff8
 #3 [ffff881b2cbf37a8] ifind_fast at ffffffff811b315c
 #4 [ffff881b2cbf37d8] iget_locked at ffffffff811b33f9
 #5 [ffff881b2cbf3818] ldiskfs_iget at ffffffffa0e247b7 [ldiskfs]
 #6 [ffff881b2cbf3888] osd_iget at ffffffffa0f04d4e [osd_ldiskfs]
 #7 [ffff881b2cbf38b8] osd_obj_map_lookup at ffffffffa0f34743 [osd_ldiskfs]
 #8 [ffff881b2cbf3938] osd_oi_lookup at ffffffffa0f2117a [osd_ldiskfs]
 #9 [ffff881b2cbf3968] osd_object_init at ffffffffa0f16499 [osd_ldiskfs]
#10 [ffff881b2cbf3a48] lu_object_alloc at ffffffffa0729e18 [obdclass]
#11 [ffff881b2cbf3aa8] lu_object_find_try at ffffffffa072b361 [obdclass]
#12 [ffff881b2cbf3b38] lu_object_find_at at ffffffffa072b521 [obdclass]
#13 [ffff881b2cbf3bc8] lu_object_find at ffffffffa072b566 [obdclass]
#14 [ffff881b2cbf3bd8] ofd_object_find at ffffffffa10a5aa5 [ofd]
#15 [ffff881b2cbf3c08] ofd_lvbo_init at ffffffffa10b977f [ofd]
#16 [ffff881b2cbf3cb8] ldlm_handle_enqueue0 at ffffffffa09308dd [ptlrpc]
#17 [ffff881b2cbf3d28] tgt_enqueue at ffffffffa09b9eb1 [ptlrpc]
#18 [ffff881b2cbf3d48] tgt_request_handle at ffffffffa09baece [ptlrpc]
#19 [ffff881b2cbf3da8] ptlrpc_main at ffffffffa0964ca1 [ptlrpc]
#20 [ffff881b2cbf3ee8] kthread at ffffffff810a379e
#21 [ffff881b2cbf3f48] kernel_thread at ffffffff8
...............
PID: 61556  TASK: ffff8804b009a040  CPU: 8   COMMAND: &quot;perfquery&quot;
 #0 [ffff8804b009f5a8] schedule at ffffffff81581292
 #1 [ffff8804b009f680] start_this_handle at ffffffffa0df0fca [jbd2]
 #2 [ffff8804b009f740] jbd2_journal_start at ffffffffa0df13d5 [jbd2]
 #3 [ffff8804b009f780] ldiskfs_journal_start_sb at ffffffffa0e49b86 [ldiskfs]
 #4 [ffff8804b009f7a0] ldiskfs_dquot_drop at ffffffffa0e49f15 [ldiskfs]
 #5 [ffff8804b009f7d0] vfs_dq_drop at ffffffff811f7ca2
 #6 [ffff8804b009f7e0] clear_inode at ffffffff811b2623
 #7 [ffff8804b009f800] dispose_list at ffffffff811b2710
 #8 [ffff8804b009f840] shrink_icache_memory at ffffffff811b2a64
 #9 [ffff8804b009f8a0] shrink_slab at ffffffff8114253a
#10 [ffff8804b009f900] do_try_to_free_pages at ffffffff811448df
#11 [ffff8804b009f9a0] try_to_free_pages at ffffffff81144d85
#12 [ffff8804b009fa50] __alloc_pages_nodemask at ffffffff81138d8d
#13 [ffff8804b009fba0] alloc_pages_current at ffffffff8117255a
#14 [ffff8804b009fbd0] __get_free_pages at ffffffff8113655e
#15 [ffff8804b009fbe0] get_zeroed_page at ffffffff811365b6
#16 [ffff8804b009fbf0] sysfs_follow_link at ffffffff81215136
#17 [ffff8804b009fc50] __link_path_walk at ffffffff811a4f26
#18 [ffff8804b009fd30] path_walk at ffffffff811a5e0a
#19 [ffff8804b009fd70] filename_lookup at ffffffff811a601b
#20 [ffff8804b009fdb0] do_filp_open at ffffffff811a74f4
#21 [ffff8804b009ff20] do_sys_open at ffffffff81191607
#22 [ffff8804b009ff70] sys_open at ffffffff81191710
#23 [ffff8804b009ff80] system_call_fastpath at ffffffff8100b0d2
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;This is indeed a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6918&quot; title=&quot;Deadlock on transaction with iget()/clear_inode()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6918&quot;&gt;&lt;del&gt;LU-6918&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
YangSheng&lt;/p&gt;</comment>
                            <comment id="216720" author="pjones" created="Tue, 19 Dec 2017 14:31:38 +0000"  >&lt;p&gt;As per Alex, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6918&quot; title=&quot;Deadlock on transaction with iget()/clear_inode()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6918&quot;&gt;&lt;del&gt;LU-6918&lt;/del&gt;&lt;/a&gt; was a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6969&quot; title=&quot;osd_internal.h:1090:osd_trans_exec_check()) LBUG for osd_index_ea_delete()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6969&quot;&gt;&lt;del&gt;LU-6969&lt;/del&gt;&lt;/a&gt; so this issue should be fixed in more current releases&lt;/p&gt;</comment>
                            <comment id="229585" author="mhanafi" created="Thu, 14 Jun 2018 19:59:23 +0000"  >&lt;p&gt;This can be closed&lt;/p&gt;</comment>
                            <comment id="229590" author="pjones" created="Sat, 16 Jun 2018 13:53:06 +0000"  >&lt;p&gt;Thanks Mahmoud&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="28946" name="bt.all" size="1374469" author="mhanafi" created="Fri, 15 Dec 2017 20:42:44 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzpmv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10021"><![CDATA[2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>