<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:23:49 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2272] BUG: spinlock cpu recursion on CPU#2, ll_sa_30972/30992</title>
                <link>https://jira.whamcloud.com/browse/LU-2272</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Running racer with a debugging kernel on master I hit this condition:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 8529.226634] BUG: spinlock cpu recursion on CPU#2, ll_sa_30972/30992 (Not tainted)
[ 8529.227125]  lock: ffff88009cb38eb8, .magic: dead4ead, .owner: ptlrpcd_2/7457, .owner_cpu: 2
[ 8529.227595] Pid: 30992, comm: ll_sa_30972 Not tainted 2.6.32-debug #6
[ 8529.227874] Call Trace:
[ 8529.228084]  [&amp;lt;ffffffff8128098a&amp;gt;] ? spin_bug+0xaa/0x100
[ 8529.228342]  [&amp;lt;ffffffff81280ba1&amp;gt;] ? _raw_spin_lock+0x121/0x180
[ 8529.228610]  [&amp;lt;ffffffff814fafde&amp;gt;] ? _spin_lock+0xe/0x10
[ 8529.228892]  [&amp;lt;ffffffffa0d3192c&amp;gt;] ? do_statahead_interpret+0x4c/0xdd0 [lustre]
[ 8529.229426]  [&amp;lt;ffffffff8109011c&amp;gt;] ? remove_wait_queue+0x3c/0x50
[ 8529.229718]  [&amp;lt;ffffffffa0d3690a&amp;gt;] ? ll_statahead_thread+0xcda/0xf40 [lustre]
[ 8529.230008]  [&amp;lt;ffffffff81057d60&amp;gt;] ? default_wake_function+0x0/0x20
[ 8529.230293]  [&amp;lt;ffffffffa0d35c30&amp;gt;] ? ll_statahead_thread+0x0/0xf40 [lustre]
[ 8529.230577]  [&amp;lt;ffffffff8100c14a&amp;gt;] ? child_rip+0xa/0x20
[ 8529.230844]  [&amp;lt;ffffffffa0d35c30&amp;gt;] ? ll_statahead_thread+0x0/0xf40 [lustre]
[ 8529.231142]  [&amp;lt;ffffffffa0d35c30&amp;gt;] ? ll_statahead_thread+0x0/0xf40 [lustre]
[ 8529.231429]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="16561">LU-2272</key>
            <summary>BUG: spinlock cpu recursion on CPU#2, ll_sa_30972/30992</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="green">Oleg Drokin</reporter>
                        <labels>
                    </labels>
                <created>Sat, 3 Nov 2012 20:28:48 +0000</created>
                <updated>Fri, 11 Dec 2015 15:49:07 +0000</updated>
                            <resolved>Sun, 22 Sep 2013 13:47:21 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                                    <fixVersion>Lustre 2.7.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>9</watches>
                                                                            <comments>
                            <comment id="47366" author="green" created="Sat, 3 Nov 2012 20:29:55 +0000"  >&lt;p&gt;Seems to be related to statahead, so FanYong, can you please take a look?&lt;/p&gt;</comment>
                            <comment id="47370" author="yong.fan" created="Sun, 4 Nov 2012 00:40:14 +0000"  >&lt;p&gt;OK, I will try to reproduce it myself and dump the log.&lt;/p&gt;</comment>
                            <comment id="49077" author="green" created="Tue, 11 Dec 2012 15:24:15 +0000"  >&lt;p&gt;I just had this hit again in my racer testing on very fresh master:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Dec 11 15:15:42 centos6-8 kernel: [226594.953228] BUG: spinlock cpu recursion on CPU#0, ll_sa_13669/13959 (Not tainted)
Dec 11 15:15:42 centos6-8 kernel: [226594.953702]  lock: ffff880018c19eb8, .magic: dead4ead, .owner: ptlrpcd_2/26580, .owner_cpu: 0
Dec 11 15:15:42 centos6-8 kernel: [226594.954248] Pid: 13959, comm: ll_sa_13669 Not tainted 2.6.32-debug #6
Dec 11 15:15:42 centos6-8 kernel: [226594.954815] Call Trace:
Dec 11 15:15:42 centos6-8 kernel: [226594.955034]  [&amp;lt;ffffffff8128098a&amp;gt;] ? spin_bug+0xaa/0x100
Dec 11 15:15:42 centos6-8 kernel: [226594.955285]  [&amp;lt;ffffffff81280ba1&amp;gt;] ? _raw_spin_lock+0x121/0x180
Dec 11 15:15:42 centos6-8 kernel: [226594.955548]  [&amp;lt;ffffffff814fafde&amp;gt;] ? _spin_lock+0xe/0x10
Dec 11 15:15:42 centos6-8 kernel: [226594.955851]  [&amp;lt;ffffffffa0e368dc&amp;gt;] ? do_statahead_interpret+0x4c/0xdd0 [lustre]
Dec 11 15:15:42 centos6-8 kernel: [226594.957300]  [&amp;lt;ffffffff8109011c&amp;gt;] ? remove_wait_queue+0x3c/0x50
Dec 11 15:15:42 centos6-8 kernel: [226594.957612]  [&amp;lt;ffffffffa0e3b90a&amp;gt;] ? ll_statahead_thread+0xcda/0xf40 [lustre]
Dec 11 15:15:42 centos6-8 kernel: [226594.957977]  [&amp;lt;ffffffff81057d60&amp;gt;] ? default_wake_function+0x0/0x20
Dec 11 15:15:42 centos6-8 kernel: [226594.958317]  [&amp;lt;ffffffffa0e3ac30&amp;gt;] ? ll_statahead_thread+0x0/0xf40 [lustre]
Dec 11 15:15:42 centos6-8 kernel: [226594.959502]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="58980" author="green" created="Tue, 21 May 2013 15:49:36 +0000"  >&lt;p&gt;Ok, I finally got to the root of it.&lt;br/&gt;
The reason we hit it is that in ll_statahead_interpret we sleep under a spinlock:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;crash&amp;gt; bt 21485
PID: 21485  TASK: ffff8800b2906540  CPU: 7   COMMAND: &quot;ptlrpcd_4&quot;
 #0 [ffff8800b098f930] schedule at ffffffff814fae3a
 #1 [ffff8800b098f9f8] __cond_resched at ffffffff810644ea
 #2 [ffff8800b098fa18] _cond_resched at ffffffff814fb840
 #3 [ffff8800b098fa28] __kmalloc at ffffffff811686d0
 #4 [ffff8800b098fa78] cfs_alloc at ffffffffa0b0cb90 [libcfs]
 #5 [ffff8800b098faa8] ldlm_bl_to_thread at ffffffffa1268cc1 [ptlrpc]
 #6 [ffff8800b098fbb8] ldlm_bl_to_thread_lock at ffffffffa1269219 [ptlrpc]
 #7 [ffff8800b098fbc8] ldlm_lock_decref_internal at ffffffffa1246ccd [ptlrpc]
 #8 [ffff8800b098fc28] ldlm_lock_decref at ffffffffa1247d69 [ptlrpc]
 #9 [ffff8800b098fc58] ll_intent_drop_lock at ffffffffa07dac8d [lustre]
#10 [ffff8800b098fc88] ll_statahead_interpret at ffffffffa0838e66 [lustre]
#11 [ffff8800b098fce8] mdc_intent_getattr_async_interpret at ffffffffa0dea4a2 [mdc]
#12 [ffff8800b098fd68] ptlrpc_check_set at ffffffffa12804e2 [ptlrpc]
#13 [ffff8800b098fe08] ptlrpcd_check at ffffffffa12adc5b [ptlrpc]
#14 [ffff8800b098fe68] ptlrpcd at ffffffffa12ae1a3 [ptlrpc]
#15 [ffff8800b098ff48] kernel_thread at ffffffff8100c10a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;While I mostly hit the warnings like in this ticket, right now I got a deadlock, and that&apos;s how I finally found this issue.&lt;br/&gt;
offending code:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;                        entry-&amp;gt;se_minfo = minfo;
                        entry-&amp;gt;se_req = ptlrpc_request_addref(req);
                        /* Release the async ibits lock ASAP to avoid deadlock
                         * when statahead thread tries to enqueue lock on parent
                         * for readpage and other tries to enqueue lock on child
                         * with parent&apos;s lock held, for example: unlink. */
                        entry-&amp;gt;se_handle = it-&amp;gt;d.lustre.it_lock_handle;
can sleep!!! =&amp;gt;         ll_intent_drop_lock(it);
                        wakeup = sa_received_empty(sai);
                        cfs_list_add_tail(&amp;amp;entry-&amp;gt;se_list,
                                          &amp;amp;sai-&amp;gt;sai_entries_received);
                }
                sai-&amp;gt;sai_replied++;
                spin_unlock(&amp;amp;lli-&amp;gt;lli_sa_lock);
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="58995" author="pjones" created="Tue, 21 May 2013 17:53:05 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;Are you able to advise on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="59037" author="laisiyao" created="Wed, 22 May 2013 08:11:19 +0000"  >&lt;p&gt;The fix will modify the same code as the patch for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3270&quot; title=&quot;ptlrpcd strnlen crash trying to log a message&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3270&quot;&gt;&lt;del&gt;LU-3270&lt;/del&gt;&lt;/a&gt;, so I based this fix on &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3270&quot; title=&quot;ptlrpcd strnlen crash trying to log a message&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3270&quot;&gt;&lt;del&gt;LU-3270&lt;/del&gt;&lt;/a&gt;: &lt;a href=&quot;http://review.whamcloud.com/#change,6413&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,6413&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="66156" author="laisiyao" created="Tue, 10 Sep 2013 05:06:28 +0000"  >&lt;p&gt;The above patch is abandoned, and the fix is included in &lt;a href=&quot;http://review.whamcloud.com/#/c/6392/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/6392/&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="67203" author="pjones" created="Sun, 22 Sep 2013 13:34:53 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;So can we duplicate this ticket into &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3270&quot; title=&quot;ptlrpcd strnlen crash trying to log a message&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3270&quot;&gt;&lt;del&gt;LU-3270&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="67204" author="laisiyao" created="Sun, 22 Sep 2013 13:42:45 +0000"  >&lt;p&gt;Yes, Peter. &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3270&quot; title=&quot;ptlrpcd strnlen crash trying to log a message&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3270&quot;&gt;&lt;del&gt;LU-3270&lt;/del&gt;&lt;/a&gt; fixed a number of statahead bugs, including this one.&lt;/p&gt;</comment>
                            <comment id="67205" author="pjones" created="Sun, 22 Sep 2013 13:47:21 +0000"  >&lt;p&gt;ok thanks!&lt;/p&gt;</comment>
                            <comment id="107754" author="gerrit" created="Tue, 24 Feb 2015 08:41:38 +0000"  >&lt;p&gt;Jian Yu (jian.yu@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/13846&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/13846&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2272&quot; title=&quot;BUG: spinlock cpu recursion on CPU#2, ll_sa_30972/30992&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2272&quot;&gt;&lt;del&gt;LU-2272&lt;/del&gt;&lt;/a&gt; statahead: ll_intent_drop_lock() called in spinlock&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_5&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 668bbb377ab45b9e863844406682c865de684b66&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                                <inwardlinks description="is related to">
                                                        </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvbnj:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>5431</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>