<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:40:33 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-4197] deadlock in recovery</title>
                <link>https://jira.whamcloud.com/browse/LU-4197</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Bug originally hit during xyratex testing.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;BUG: spinlock lockup on CPU#3, tgt_recov/8159, ffff880099c1ca90 (Tainted: G        W  ----------------  )
Pid: 8159, comm: tgt_recov Tainted: G        W  ----------------   2.6.32-131.17.1-lustre #0
Call Trace:
 [&amp;lt;ffffffff8128c2da&amp;gt;] ? _raw_spin_lock+0x16a/0x180
 [&amp;lt;ffffffff81500ff6&amp;gt;] ? _spin_lock+0x56/0x70
 [&amp;lt;ffffffffa056668a&amp;gt;] ? class_export_recovery_cleanup+0x3a/0x230 [obdclass]
 [&amp;lt;ffffffffa03ea572&amp;gt;] ? cfs_hash_del+0xa2/0x1d0 [libcfs]
 [&amp;lt;ffffffffa056668a&amp;gt;] ? class_export_recovery_cleanup+0x3a/0x230 [obdclass]
 [&amp;lt;ffffffffa056875d&amp;gt;] ? class_disconnect+0x15d/0x3d0 [obdclass]
 [&amp;lt;ffffffffa06bfd17&amp;gt;] ? server_disconnect_export+0x37/0x1a0 [ptlrpc]
 [&amp;lt;ffffffffa0c9630f&amp;gt;] ? filter_disconnect+0xbf/0x380 [obdfilter]
 [&amp;lt;ffffffffa056db97&amp;gt;] ? class_disconnect_export_list+0x347/0x680 [obdclass]
 [&amp;lt;ffffffffa056e027&amp;gt;] ? class_disconnect_stale_exports+0x157/0x380 [obdclass]
 [&amp;lt;ffffffffa06bc180&amp;gt;] ? exp_connect_healthy+0x0/0x20 [ptlrpc]
 [&amp;lt;ffffffffa06bc490&amp;gt;] ? check_for_clients+0x0/0x80 [ptlrpc]
 [&amp;lt;ffffffffa06bf04b&amp;gt;] ? target_recovery_overseer+0x15b/0x2d0 [ptlrpc]
 [&amp;lt;ffffffffa06bc180&amp;gt;] ? exp_connect_healthy+0x0/0x20 [ptlrpc]
 [&amp;lt;ffffffff81091a80&amp;gt;] ? autoremove_wake_function+0x0/0x40
 [&amp;lt;ffffffffa06c4b90&amp;gt;] ? target_recovery_thread+0x460/0x15d0 [ptlrpc]
 [&amp;lt;ffffffff810563bd&amp;gt;] ? finish_task_switch+0x7d/0x110
 [&amp;lt;ffffffffa06c4730&amp;gt;] ? target_recovery_thread+0x0/0x15d0 [ptlrpc]
 [&amp;lt;ffffffff8100c2ca&amp;gt;] ? child_rip+0xa/0x20
 [&amp;lt;ffffffff81500d50&amp;gt;] ? _spin_unlock_irq+0x30/0x40
 [&amp;lt;ffffffff8100bc10&amp;gt;] ? restore_args+0x0/0x30
 [&amp;lt;ffffffffa06c4730&amp;gt;] ? target_recovery_thread+0x0/0x15d0 [ptlrpc]
 [&amp;lt;ffffffff8100c2c0&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Investigating the bug led to the commit that backported &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1522&quot; title=&quot;ASSERTION(cfs_atomic_read(&amp;amp;obd-&amp;gt;obd_req_replay_clients) == 0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1522&quot;&gt;&lt;del&gt;LU-1522&lt;/del&gt;&lt;/a&gt;.&lt;br/&gt;
A quick look shows that the bug also exists in the target_handle_connect() function on b2_1:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;        cfs_spin_lock(&amp;amp;target-&amp;gt;obd_recovery_task_lock);
        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (target-&amp;gt;obd_recovering &amp;amp;&amp;amp; !export-&amp;gt;exp_in_recovery &amp;amp;&amp;amp;
            !export-&amp;gt;exp_disconnected) {
                cfs_spin_lock(&amp;amp;export-&amp;gt;exp_lock);
                /* possible race with class_disconnect_stale_exports,
                 * export may be already in the eviction process */
                &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (export-&amp;gt;exp_failed) {
                        cfs_spin_unlock(&amp;amp;export-&amp;gt;exp_lock);
                        GOTO(out, rc = -ENODEV);
                }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;So if we race with the disconnect of stale exports, we exit with obd_recovery_task_lock still held, which kills recovery and the whole node.&lt;/p&gt;</description>
                <environment>RHEL6</environment>
        <key id="21785">LU-4197</key>
            <summary>deadlock in recovery</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="dmiter">Dmitry Eremin</assignee>
                                    <reporter username="shadow">Alexey Lyashkov</reporter>
                        <labels>
                            <label>patch</label>
                    </labels>
                <created>Fri, 1 Nov 2013 20:06:23 +0000</created>
                <updated>Tue, 15 Sep 2015 17:35:39 +0000</updated>
                            <resolved>Tue, 15 Sep 2015 17:35:39 +0000</resolved>
                                    <version>Lustre 2.1.6</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="70711" author="sergey" created="Tue, 5 Nov 2013 14:11:50 +0000"  >&lt;p&gt;Patch to solve this issue: &lt;a href=&quot;http://review.whamcloud.com/#/c/8178/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8178/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="126167" author="green" created="Thu, 3 Sep 2015 14:47:15 +0000"  >&lt;p&gt;Is this patch needed anywhere else but 2.1.x codebase? 2.1.x is long unused, so if the issue is unique to 2.1.6, let&apos;s just close this ticket as WONTFIX&lt;/p&gt;</comment>
                            <comment id="126346" author="sergey" created="Fri, 4 Sep 2015 06:55:34 +0000"  >&lt;p&gt;It seems the issue is unique to 2.1. I think we can close it.&lt;/p&gt;</comment>
                            <comment id="127369" author="adilger" created="Tue, 15 Sep 2015 17:35:39 +0000"  >&lt;p&gt;No longer being seen beyond 2.1.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw7n3:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>11384</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>