<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:00:18 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-6447] mdt_identity_upcall calls sleeping function under rwlock</title>
                <link>https://jira.whamcloud.com/browse/LU-6447</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Running on RHEL7.1 with CONFIG_DEBUG_SLEEP_ATOMIC enabled caught this gem:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Mar 27 21:12:13 centos6-16 kernel: BUG: sleeping function called from invalid context at mm/slab.c:3054
Mar 27 21:12:13 centos6-16 kernel: in_atomic(): 1, irqs_disabled(): 0, pid: 19599, name: mdt00_001
Mar 27 21:12:13 centos6-16 kernel: 1 lock held by mdt00_001/19599:
Mar 27 21:12:13 centos6-16 kernel: #0:  (&amp;amp;cache-&amp;gt;uc_upcall_rwlock){......}, at: [&amp;lt;ffffffffa0b15ad1&amp;gt;] mdt_identity_do_upcall+0x91/0x470 [mdt]
Mar 27 21:12:13 centos6-16 kernel: CPU: 3 PID: 19599 Comm: mdt00_001 Tainted: GF       W  O--------------   3.10.0-debug #5
Mar 27 21:12:13 centos6-16 kernel: Hardware name: Bochs Bochs, BIOS Bochs 01/01/2011
Mar 27 21:12:13 centos6-16 kernel: ffff8800808945c0 000000006b10abfb ffff88008b1eb808 ffffffff816ccb68
Mar 27 21:12:13 centos6-16 kernel: ffff88008b1eb820 ffffffff810a8fd9 0000000000000000 ffff88008b1eb8b8
Mar 27 21:12:13 centos6-16 kernel: ffffffff811bdeda ffff880074b48000 0000000000000246 0000000000000000
Mar 27 21:12:13 centos6-16 kernel: Call Trace:
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff816ccb68&amp;gt;] dump_stack+0x19/0x1b
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff810a8fd9&amp;gt;] __might_sleep+0xe9/0x110
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff811bdeda&amp;gt;] __kmalloc_track_caller+0x11a/0x620
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0b15b0b&amp;gt;] ? mdt_identity_do_upcall+0xcb/0x470 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff81182f91&amp;gt;] kstrdup+0x31/0x60
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0b15b0b&amp;gt;] mdt_identity_do_upcall+0xcb/0x470 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa02de48f&amp;gt;] upcall_cache_get_entry+0x2af/0x8e0 [obdclass]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa050ef87&amp;gt;] ? lustre_msg_buf+0x17/0x60 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0536882&amp;gt;] ? __req_capsule_get+0x162/0x710 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa05116cf&amp;gt;] ? lustre_pack_reply_flags+0x6f/0x1e0 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0b16437&amp;gt;] mdt_identity_get+0x17/0x50 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0af921a&amp;gt;] mdt_init_ucred_reint+0x23a/0x380 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0ae9dcb&amp;gt;] mdt_reint_internal+0x24b/0x760 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0aea442&amp;gt;] mdt_intent_reint+0x162/0x400 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa0af447a&amp;gt;] mdt_intent_policy+0x57a/0xbe0 [mdt]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa04c6f66&amp;gt;] ldlm_lock_enqueue+0x326/0x900 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa014f505&amp;gt;] ? cfs_hash_rw_unlock+0x15/0x20 [libcfs]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa04ed672&amp;gt;] ldlm_handle_enqueue0+0x502/0x1520 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa05135b0&amp;gt;] ? lustre_swab_ldlm_lock_desc+0x30/0x30 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa05670e2&amp;gt;] tgt_enqueue+0x62/0x210 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa056b5c5&amp;gt;] tgt_request_handle+0x645/0xfe0 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa051c881&amp;gt;] ptlrpc_server_handle_request+0x231/0xab0 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa051a3f8&amp;gt;] ? ptlrpc_wait_event+0xb8/0x360 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa05207d0&amp;gt;] ptlrpc_main+0xae0/0x1ee0 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff816d5b97&amp;gt;] ? _raw_spin_unlock_irq+0x27/0x50
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff816d38be&amp;gt;] ? __schedule+0x2fe/0x810
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffffa051fcf0&amp;gt;] ? ptlrpc_register_service+0xf20/0xf20 [ptlrpc]
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff8109c00a&amp;gt;] kthread+0xea/0xf0
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff8109bf20&amp;gt;] ? kthread_create_on_node+0x140/0x140
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff816df2bc&amp;gt;] ret_from_fork+0x7c/0xb0
Mar 27 21:12:13 centos6-16 kernel: [&amp;lt;ffffffff8109bf20&amp;gt;] ? kthread_create_on_node+0x140/0x140
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="29459">LU-6447</key>
            <summary>mdt_identity_upcall calls sleeping function under rwlock</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="niu">Niu Yawei</assignee>
                                    <reporter username="green">Oleg Drokin</reporter>
                        <labels>
                            <label>llnl</label>
                    </labels>
                <created>Fri, 10 Apr 2015 02:26:58 +0000</created>
                <updated>Thu, 16 Feb 2017 20:49:21 +0000</updated>
                            <resolved>Thu, 11 Aug 2016 12:09:30 +0000</resolved>
                                                    <fixVersion>Lustre 2.9.0</fixVersion>
                                        <due></due>
                            <votes>1</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="111885" author="gerrit" created="Fri, 10 Apr 2015 02:32:43 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/14432&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/14432&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6447&quot; title=&quot;mdt_identity_upcall calls sleeping function under rwlock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6447&quot;&gt;&lt;del&gt;LU-6447&lt;/del&gt;&lt;/a&gt; mdt: mdt_identity_upcall to not block with rwlock held&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 912a0861bc6fff558483a58bc29cad76c7ae4681&lt;/p&gt;</comment>
                            <comment id="111886" author="green" created="Fri, 10 Apr 2015 02:33:51 +0000"  >&lt;p&gt;This is my first stab at the problem unless somebody has better ideas&lt;/p&gt;</comment>
                            <comment id="154466" author="dinatale2" created="Thu, 2 Jun 2016 17:17:47 +0000"  >&lt;p&gt;We&apos;ve started seeing a very similar call stack with the same error in a testbed we&apos;ve stood up.&lt;/p&gt;</comment>
                            <comment id="154480" author="green" created="Thu, 2 Jun 2016 17:41:02 +0000"  >&lt;p&gt;Yes, it&apos;s a problem on rhel7 with debug atomic sleep option enabled.&lt;br/&gt;
In the meantime, I am carrying my patch referenced above, even though it&apos;s not perfect, to reduce the amount of noise in my logs.&lt;/p&gt;</comment>
                            <comment id="156575" author="morrone" created="Wed, 22 Jun 2016 21:16:55 +0000"  >&lt;p&gt;This seems to be implicated in long (15 second) hangs that I am sometimes seeing when poking around the lustre filesystem interactively.  That is going to be a big issue for our hotline when 2.8 goes live, so we really need a fix.  I would think this should be on the docket for fixing before 2.9 comes out.&lt;/p&gt;</comment>
                            <comment id="158392" author="pjones" created="Mon, 11 Jul 2016 22:00:25 +0000"  >&lt;p&gt;Niu&lt;/p&gt;

&lt;p&gt;Could you please refresh Oleg&apos;s patch to address the existing concerns?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="161560" author="gerrit" created="Thu, 11 Aug 2016 05:52:23 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;http://review.whamcloud.com/14432/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/14432/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6447&quot; title=&quot;mdt_identity_upcall calls sleeping function under rwlock&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6447&quot;&gt;&lt;del&gt;LU-6447&lt;/del&gt;&lt;/a&gt; mdt: mdt_identity_upcall to not block with rwlock held&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: e8273a3dd71c4e6ab5ca9de3fbfbc0f7603d6930&lt;/p&gt;</comment>
                            <comment id="161588" author="pjones" created="Thu, 11 Aug 2016 12:09:30 +0000"  >&lt;p&gt;Landed for 2.9&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzxai7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>