<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:01:29 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13462] MDS deadlocks in osd_read_lock()</title>
                <link>https://jira.whamcloud.com/browse/LU-13462</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;MDS deadlocked&lt;/p&gt;

&lt;p&gt;Similar to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13073&quot; title=&quot;Multiple MDS deadlocks (in lod_qos_prep_create) after OSS crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13073&quot;&gt;&lt;del&gt;LU-13073&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;

[12287155.058187] LNet: Service thread pid 15312 was inactive &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; 550.48s. The thread might be hung, or it might only be slow and will resume later. Dumping the stack trace &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; debugging purposes:
[12287155.109703] LNet: Skipped 2 previous similar messages
[12287155.125609]  [&amp;lt;ffffffffa5f87398&amp;gt;] call_rwsem_down_read_failed+0x18/0x30
[12287155.130583]  [&amp;lt;ffffffffc144acfc&amp;gt;] osd_read_lock+0x5c/0xe0 [osd_ldiskfs]
[12287155.130612]  [&amp;lt;ffffffffc16f28ea&amp;gt;] lod_read_lock+0x3a/0xd0 [lod]
[12287155.130625]  [&amp;lt;ffffffffc17779aa&amp;gt;] mdd_read_lock+0x3a/0xd0 [mdd]
[12287155.130632]  [&amp;lt;ffffffffc177d730&amp;gt;] mdd_xattr_get+0x70/0x5c0 [mdd]
[12287155.130648]  [&amp;lt;ffffffffc15e6ea6&amp;gt;] mdt_stripe_get+0xd6/0x400 [mdt]
[12287155.130657]  [&amp;lt;ffffffffc15e7a2d&amp;gt;] mdt_attr_get_complex+0x46d/0x850 [mdt]
[12287155.130665]  [&amp;lt;ffffffffc15e800c&amp;gt;] mdt_getattr_internal+0x1fc/0xf60 [mdt]
[12287155.130673]  [&amp;lt;ffffffffc15ebd60&amp;gt;] mdt_getattr_name_lock+0x950/0x1c30 [mdt]
[12287155.130681]  [&amp;lt;ffffffffc15f3c05&amp;gt;] mdt_intent_getattr+0x2b5/0x480 [mdt]
[12287155.130691]  [&amp;lt;ffffffffc15f0a18&amp;gt;] mdt_intent_policy+0x2e8/0xd00 [mdt]
[12287155.130736]  [&amp;lt;ffffffffc0f2dd26&amp;gt;] ldlm_lock_enqueue+0x366/0xa60 [ptlrpc]
[12287155.130769]  [&amp;lt;ffffffffc0f56587&amp;gt;] ldlm_handle_enqueue0+0xa47/0x15a0 [ptlrpc]
[12287155.130815]  [&amp;lt;ffffffffc0fde882&amp;gt;] tgt_enqueue+0x62/0x210 [ptlrpc]
[12287155.130853]  [&amp;lt;ffffffffc0fe31da&amp;gt;] tgt_request_handle+0xaea/0x1580 [ptlrpc]
[12287155.130887]  [&amp;lt;ffffffffc0f8880b&amp;gt;] ptlrpc_server_handle_request+0x24b/0xab0 [ptlrpc]
[12287155.130921]  [&amp;lt;ffffffffc0f8c13c&amp;gt;] ptlrpc_main+0xafc/0x1fc0 [ptlrpc]
[12287155.130925]  [&amp;lt;ffffffffa5cc1da1&amp;gt;] kthread+0xd1/0xe0
[12287155.130929]  [&amp;lt;ffffffffa6375c37&amp;gt;] ret_from_fork_nospec_end+0x0/0x39
[12287155.130947]  [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="58816">LU-13462</key>
            <summary>MDS deadlocks in osd_read_lock()</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Sat, 18 Apr 2020 02:54:58 +0000</created>
                <updated>Mon, 25 Jul 2022 18:38:52 +0000</updated>
                            <resolved>Mon, 25 Jul 2022 18:38:52 +0000</resolved>
                                    <version>Lustre 2.12.2</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="267937" author="pjones" created="Sat, 18 Apr 2020 13:00:01 +0000"  >&lt;p&gt;Mahmoud&lt;/p&gt;

&lt;p&gt;Could you please supply details of the kernel version that you are running?&lt;/p&gt;

&lt;p&gt;Yang Sheng&lt;/p&gt;

&lt;p&gt;Could you please advise&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="267952" author="ys" created="Sat, 18 Apr 2020 15:03:34 +0000"  >&lt;p&gt;Hi, Mahmoud,&lt;/p&gt;


&lt;p&gt;Could you please provide more info? What do you mean by similar to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13073&quot; title=&quot;Multiple MDS deadlocks (in lod_qos_prep_create) after OSS crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13073&quot;&gt;&lt;del&gt;LU-13073&lt;/del&gt;&lt;/a&gt;? &lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
Yangsheng&lt;/p&gt;</comment>
                            <comment id="268078" author="mhanafi" created="Mon, 20 Apr 2020 17:32:34 +0000"  >&lt;p&gt;The stack trace for hung threads is the same as &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13073&quot; title=&quot;Multiple MDS deadlocks (in lod_qos_prep_create) after OSS crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13073&quot;&gt;&lt;del&gt;LU-13073&lt;/del&gt;&lt;/a&gt;. But in our case we didn&apos;t have an OSS crash.&lt;/p&gt;

&lt;p&gt;Our kernel is: 3.10.0-957.21.3.el7_lustre212.x86_64&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="268347" author="ys" created="Thu, 23 Apr 2020 13:26:20 +0000"  >&lt;p&gt;Then is it possible to provide sysrq-t info? From the stack trace, I don&apos;t think it is the same as LU-13073.&lt;/p&gt;</comment>
                            <comment id="268392" author="mhanafi" created="Thu, 23 Apr 2020 17:04:03 +0000"  >&lt;p&gt;Attached the stack trace.&lt;/p&gt;</comment>
                            <comment id="268450" author="ys" created="Fri, 24 Apr 2020 03:17:17 +0000"  >&lt;p&gt;Hi, Mahmoud,&lt;/p&gt;

&lt;p&gt;The log you attached really is a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13073&quot; title=&quot;Multiple MDS deadlocks (in lod_qos_prep_create) after OSS crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13073&quot;&gt;&lt;del&gt;LU-13073&lt;/del&gt;&lt;/a&gt;. But it is different from the stack trace you pasted. The log you pasted shows a thread stuck on osd_read_lock. This was most likely caused by some local filesystem issue. But &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13073&quot; title=&quot;Multiple MDS deadlocks (in lod_qos_prep_create) after OSS crash&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13073&quot;&gt;&lt;del&gt;LU-13073&lt;/del&gt;&lt;/a&gt; is not. It is a long-outstanding issue caused by the OSS. &lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
YangSheng&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="57632">LU-13073</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="34746" name="s.600.Apr17.2020_crash.bt.all" size="1549666" author="mhanafi" created="Thu, 23 Apr 2020 17:04:19 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00y7b:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10021"><![CDATA[2]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>