<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:48:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-5128] ASSERTION( atomic_read(&amp;obd-&gt;obd_req_replay_clients) == 0 ) failed</title>
                <link>https://jira.whamcloud.com/browse/LU-5128</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;The MDS failed over, and once the MDS&apos;s recovery finished, many OSSes crashed due to the following ASSERTION.&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;2014-05-30 17:39:07 Lustre: Skipped 3 previous similar messages
2014-05-30 17:39:07 LustreError: 18967:0:(ldlm_lib.c:1851:target_next_replay_req()) ASSERTION( atomic_read(&amp;amp;obd-&amp;gt;obd_req_replay_clients) == 0 ) failed: 
2014-05-30 17:39:07 LustreError: 18967:0:(ldlm_lib.c:1851:target_next_replay_req()) LBUG
2014-05-30 17:39:07 Pid: 18967, comm: tgt_recov
2014-05-30 17:39:07 
2014-05-30 17:39:07 Call Trace:
2014-05-30 17:39:07  [&amp;lt;ffffffffa0353895&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
2014-05-30 17:39:07  [&amp;lt;ffffffffa0353e97&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066f48c&amp;gt;] target_recovery_thread+0x14ac/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
2014-05-30 17:39:07 
2014-05-30 17:39:07 Kernel panic - not syncing: LBUG
2014-05-30 17:39:07 Pid: 18967, comm: tgt_recov Not tainted 2.6.32-358.18.1.el6_lustre.x86_64 #1
2014-05-30 17:39:07 Call Trace:
2014-05-30 17:39:07  [&amp;lt;ffffffff8150de58&amp;gt;] ? panic+0xa7/0x16f
2014-05-30 17:39:07  [&amp;lt;ffffffffa0353eeb&amp;gt;] ? lbug_with_loc+0x9b/0xb0 [libcfs]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066f48c&amp;gt;] ? target_recovery_thread+0x14ac/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffff8100c0ca&amp;gt;] ? child_rip+0xa/0x20
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffffa066dfe0&amp;gt;] ? target_recovery_thread+0x0/0x1970 [ptlrpc]
2014-05-30 17:39:07  [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1522&quot; title=&quot;ASSERTION(cfs_atomic_read(&amp;amp;obd-&amp;gt;obd_req_replay_clients) == 0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1522&quot;&gt;&lt;del&gt;LU-1522&lt;/del&gt;&lt;/a&gt; and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-2397&quot; title=&quot;Assertion triggered in check_for_next_transno&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-2397&quot;&gt;&lt;del&gt;LU-2397&lt;/del&gt;&lt;/a&gt; reported similar problems, but their patches have already been merged into b2_4.&lt;/p&gt;</description>
                <environment>Lustre-2.4.3</environment>
        <key id="24981">LU-5128</key>
            <summary>ASSERTION( atomic_read(&amp;obd-&gt;obd_req_replay_clients) == 0 ) failed</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="hongchao.zhang">Hongchao Zhang</assignee>
                                    <reporter username="ihara">Shuichi Ihara</reporter>
                        <labels>
                            <label>duu</label>
                            <label>mn4</label>
                    </labels>
                <created>Sun, 1 Jun 2014 02:37:21 +0000</created>
                <updated>Mon, 18 Aug 2014 15:21:29 +0000</updated>
                            <resolved>Wed, 6 Aug 2014 14:58:58 +0000</resolved>
                                    <version>Lustre 2.4.3</version>
                                    <fixVersion>Lustre 2.7.0</fixVersion>
                    <fixVersion>Lustre 2.5.3</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="85509" author="pjones" created="Mon, 2 Jun 2014 19:48:53 +0000"  >&lt;p&gt;Hongchao&lt;/p&gt;

&lt;p&gt;Could you please advise on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="85981" author="hongchao.zhang" created="Fri, 6 Jun 2014 06:15:42 +0000"  >&lt;p&gt;Hi,&lt;/p&gt;

&lt;p&gt;Could you please attach the complete logs for this issue? Thanks!&lt;br/&gt;
By the way, did the OSS also fail over along with the MDS?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;</comment>
                            <comment id="86002" author="hongchao.zhang" created="Fri, 6 Jun 2014 13:44:37 +0000"  >&lt;p&gt;There could be a race between &quot;target_process_req_flags&quot; and &quot;class_export_recovery_cleanup&quot;. If the replay request contains the flag&lt;br/&gt;
&quot;MSG_REQ_REPLAY_DONE&quot;, then &quot;exp-&amp;gt;exp_req_replay_needed&quot; is cleared and &quot;obd-&amp;gt;obd_req_replay_clients&quot; is decremented under the&lt;br/&gt;
protection of &quot;exp_lock&quot; in &quot;target_process_req_flags&quot;. However, &quot;class_export_recovery_cleanup&quot; checks &quot;exp_req_replay_needed&quot; without holding&lt;br/&gt;
&quot;exp_lock&quot;, so it can decrement &quot;obd_req_replay_clients&quot; a second time, which causes this issue.&lt;/p&gt;

&lt;p&gt;the patch against b2_4 is tracked at &lt;a href=&quot;http://review.whamcloud.com/#/c/10628/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/10628/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="87357" author="ihara" created="Tue, 24 Jun 2014 12:13:56 +0000"  >&lt;p&gt;Does this only happen on the b2_4 branch, or can the same problem also occur on b2_5?&lt;/p&gt;</comment>
                            <comment id="87474" author="hongchao.zhang" created="Wed, 25 Jun 2014 09:14:13 +0000"  >&lt;p&gt;the issue tracked at &lt;a href=&quot;http://review.whamcloud.com/#/c/10628/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/10628/&lt;/a&gt; also exists on b2_5&lt;/p&gt;</comment>
                            <comment id="87566" author="hongchao.zhang" created="Thu, 26 Jun 2014 15:08:47 +0000"  >&lt;p&gt;the patch against master is tracked at &lt;a href=&quot;http://review.whamcloud.com/#/c/10849/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/10849/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="89008" author="gnlwlb" created="Tue, 15 Jul 2014 08:47:52 +0000"  >&lt;p&gt;Here is the patch for b2_5: &lt;a href=&quot;http://review.whamcloud.com/#/c/11102/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/11102/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="90971" author="pjones" created="Wed, 6 Aug 2014 14:58:58 +0000"  >&lt;p&gt;Landed for 2.7&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwni7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>14153</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>