<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:11:59 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-948] Client recovery hang</title>
                <link>https://jira.whamcloud.com/browse/LU-948</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;When I rebooted two OSS to put a patch for bug &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-874&quot; title=&quot;Client eviction on lock callback timeout &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-874&quot;&gt;&lt;del&gt;LU-874&lt;/del&gt;&lt;/a&gt; on the servers, quite a few of the clients appear to have gotten deadlocked in recovery.  Here&apos;s a backtrace of ptlrpcd-rcv on one client:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;crash&amp;gt; bt 5077
PID: 5077   TASK: ffff88082da834c0  CPU: 8   COMMAND: &quot;ptlrpcd-rcv&quot;
 #0 [ffff88082da85430] schedule at ffffffff814ee3b2
 #1 [ffff88082da854f8] io_schedule at ffffffff814eeba3
 #2 [ffff88082da85518] sync_page at ffffffff81110fbd
 #3 [ffff88082da85528] __wait_on_bit_lock at ffffffff814ef40a
 #4 [ffff88082da85578] __lock_page at ffffffff81110f57
 #5 [ffff88082da855d8] vvp_page_own at ffffffffa093bf6a [lustre]
 #6 [ffff88082da855f8] cl_page_own0 at ffffffffa0601d3b [obdclass]
 #7 [ffff88082da85678] cl_page_own at ffffffffa0601fa0 [obdclass]
 #8 [ffff88082da85688] cl_page_gang_lookup at ffffffffa0603bb7 [obdclass]
 #9 [ffff88082da85758] cl_lock_page_out at ffffffffa06096fc [obdclass]
#10 [ffff88082da85808] osc_lock_flush at ffffffffa0858e8f [osc]
#11 [ffff88082da85858] osc_lock_cancel at ffffffffa0858f2a [osc]
#12 [ffff88082da858d8] cl_lock_cancel0 at ffffffffa0604665 [obdclass]
#13 [ffff88082da85928] cl_lock_cancel at ffffffffa06051ab [obdclass]
#14 [ffff88082da85968] osc_ldlm_blocking_ast at ffffffffa0859cf8 [osc]
#15 [ffff88082da859f8] ldlm_cancel_callback at ffffffffa06a1ba3 [ptlrpc]
#16 [ffff88082da85a18] ldlm_lock_cancel at ffffffffa06a1c89 [ptlrpc]
#17 [ffff88082da85a58] ldlm_cli_cancel_list_local at ffffffffa06bede8 [ptlrpc]
#18 [ffff88082da85ae8] ldlm_cancel_lru_local at ffffffffa06bf255 [ptlrpc]
#19 [ffff88082da85b08] ldlm_replay_locks at ffffffffa06bf385 [ptlrpc]
#20 [ffff88082da85bb8] ptlrpc_import_recovery_state_machine at ffffffffa070ceea [ptlrpc]
#21 [ffff88082da85c38] ptlrpc_connect_interpret at ffffffffa070db38 [ptlrpc]
#22 [ffff88082da85d08] ptlrpc_check_set at ffffffffa06dd870 [ptlrpc]
#23 [ffff88082da85de8] ptlrpcd_check at ffffffffa07113b8 [ptlrpc]
#24 [ffff88082da85e48] ptlrpcd at ffffffffa071175b [ptlrpc]
#25 [ffff88082da85f48] kernel_thread at ffffffff8100c14a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I will need to do more investigation, but that&apos;s a start.&lt;/p&gt;</description>
                <environment></environment>
        <key id="12732">LU-948</key>
            <summary>Client recovery hang</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="6" iconUrl="https://jira.whamcloud.com/images/icons/statuses/closed.png" description="The issue is considered finished, the resolution is correct. Issues which are closed can be reopened.">Closed</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="morrone">Christopher Morrone</reporter>
                        <labels>
                            <label>llnl</label>
                    </labels>
                <created>Tue, 20 Dec 2011 17:39:39 +0000</created>
                <updated>Tue, 16 Aug 2016 16:37:15 +0000</updated>
                            <resolved>Tue, 16 Aug 2016 16:37:15 +0000</resolved>
                                    <version>Lustre 2.1.0</version>
                                    <fixVersion>Lustre 2.2.0</fixVersion>
                    <fixVersion>Lustre 2.1.3</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="25022" author="morrone" created="Tue, 20 Dec 2011 17:48:35 +0000"  >&lt;p&gt;Backtrace of all tasks on a hung client, and a dump_pages.&lt;/p&gt;</comment>
                            <comment id="25026" author="pjones" created="Tue, 20 Dec 2011 18:31:32 +0000"  >&lt;p&gt;Jinshan is looking into this&lt;/p&gt;</comment>
                            <comment id="25030" author="jay" created="Tue, 20 Dec 2011 18:42:28 +0000"  >&lt;p&gt;Do you have a chance to dump lustre log at clients?&lt;/p&gt;</comment>
                            <comment id="25044" author="morrone" created="Tue, 20 Dec 2011 21:22:18 +0000"  >&lt;p&gt;No, unfortunately someone rebooted the cluster out from under me.  That was all that I could grab before the nodes went dead.&lt;/p&gt;</comment>
                            <comment id="25087" author="jay" created="Wed, 21 Dec 2011 12:05:37 +0000"  >&lt;p&gt;I&apos;ve found the root cause of this problem. If there is a BRW RPC in the resending list, canceling the ldlm lock will cause a deadlock since it will try to hold the page lock. A workaround for this problem is to disable ldlm_cancel_unused_locks_before_replay via procfs.&lt;/p&gt;

&lt;p&gt;I&apos;m working on a fix.&lt;/p&gt;</comment>
                            <comment id="26310" author="morrone" created="Tue, 10 Jan 2012 18:45:42 +0000"  >&lt;p&gt;With &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-874&quot; title=&quot;Client eviction on lock callback timeout &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-874&quot;&gt;&lt;del&gt;LU-874&lt;/del&gt;&lt;/a&gt; much improved, this is our next concern for 2.1.  Have you had any time to look at the fix for this?&lt;/p&gt;</comment>
                            <comment id="26317" author="jay" created="Tue, 10 Jan 2012 20:20:23 +0000"  >&lt;p&gt;I think this issue can be fixed by reverting commit 6fd5e00ff03d41b427eec5d70efaef4bbdd8d59c which was added in bug 16774 to address client replaying lots of unused lock during recovery.&lt;/p&gt;

&lt;p&gt;Since this issue was filed and even implemented by you guys, can you please tell me what&apos;s the side effect for clients to replay unused lock during recovery?&lt;/p&gt;</comment>
                            <comment id="26319" author="morrone" created="Tue, 10 Jan 2012 20:55:38 +0000"  >&lt;p&gt;We only implemented some of the 1.8 version.  The CLIO version for 2.X doesn&apos;t look at all familiar to me.&lt;/p&gt;

&lt;p&gt;In production, clients will need to replay tens of thousands of locks, which completely overwhelms the servers.  Since most of those locks are completely unused, it is better to drop the unused locks rather than replay them.  If they are needed again in the future, the load to recreate them on demand is easier to deal with than the flood of lock replays at recovery time.&lt;/p&gt;

&lt;p&gt;At the time we could even see the problem with just one or a few clients.  If you did something like a linux kernel compilation out of lustre, you will wind up with tens of thousands of locks on just that one node.&lt;/p&gt;

&lt;p&gt;I don&apos;t think we really want to abandon this ability.&lt;/p&gt;</comment>
                            <comment id="26409" author="jay" created="Wed, 11 Jan 2012 22:56:36 +0000"  >&lt;p&gt;patch is at: &lt;a href=&quot;http://review.whamcloud.com/1955&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/1955&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="27132" author="hudson" created="Fri, 20 Jan 2012 15:05:21 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=client,distro=sles11,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,client,sles11,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27133" author="hudson" created="Fri, 20 Jan 2012 15:17:11 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=server,distro=el5,ib_stack=ofa/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,server,el5,ofa #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27136" author="hudson" created="Fri, 20 Jan 2012 15:22:53 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=client,distro=el5,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,client,el5,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27137" author="hudson" created="Fri, 20 Jan 2012 15:24:46 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=server,distro=el6,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,server,el6,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27138" author="hudson" created="Fri, 20 Jan 2012 15:29:54 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=server,distro=el5,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,server,el5,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27139" author="hudson" created="Fri, 20 Jan 2012 15:31:45 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=client,distro=el5,ib_stack=ofa/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,client,el5,ofa #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27140" author="hudson" created="Fri, 20 Jan 2012 15:35:26 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=client,distro=el6,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,client,el6,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27142" author="hudson" created="Fri, 20 Jan 2012 15:44:14 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=client,distro=el6,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,client,el6,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27143" author="hudson" created="Fri, 20 Jan 2012 15:49:02 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=client,distro=ubuntu1004,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,client,ubuntu1004,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27144" author="hudson" created="Fri, 20 Jan 2012 15:54:11 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=x86_64,build_type=server,distro=el6,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; x86_64,server,el6,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27149" author="hudson" created="Fri, 20 Jan 2012 16:38:10 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=server,distro=el5,ib_stack=ofa/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,server,el5,ofa #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27151" author="hudson" created="Fri, 20 Jan 2012 16:42:04 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=server,distro=el5,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,server,el5,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27155" author="hudson" created="Fri, 20 Jan 2012 16:58:44 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=client,distro=el5,ib_stack=inkernel/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,client,el5,inkernel #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27156" author="hudson" created="Fri, 20 Jan 2012 17:06:45 +0000"  >&lt;p&gt;Integrated in &lt;span class=&quot;image-wrap&quot; style=&quot;&quot;&gt;&lt;img src=&quot;http://build.whamcloud.com/images/16x16/blue.png&quot; style=&quot;border: 0px solid black&quot; /&gt;&lt;/span&gt; &lt;a href=&quot;http://build.whamcloud.com/job/lustre-master/./arch=i686,build_type=client,distro=el5,ib_stack=ofa/440/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;lustre-master &#187; i686,client,el5,ofa #440&lt;/a&gt;&lt;br/&gt;
     &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup() (Revision 7076eff5cd415472061a26c897469dd5b8174861)&lt;/p&gt;

&lt;p&gt;     Result = SUCCESS&lt;br/&gt;
Oleg Drokin : &lt;a href=&quot;http://git.whamcloud.com/gitweb?p=fs/lustre-release.git;a=shortlog;h=refs/heads/master&amp;amp;a=commit&amp;amp;h=7076eff5cd415472061a26c897469dd5b8174861&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;7076eff5cd415472061a26c897469dd5b8174861&lt;/a&gt;&lt;br/&gt;
Files : &lt;/p&gt;
&lt;ul&gt;
	&lt;li&gt;lustre/obdclass/cl_lock.c&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_internal.h&lt;/li&gt;
	&lt;li&gt;lustre/include/cl_object.h&lt;/li&gt;
	&lt;li&gt;lustre/obdclass/cl_page.c&lt;/li&gt;
	&lt;li&gt;lustre/osc/osc_lock.c&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="27423" author="pjones" created="Thu, 26 Jan 2012 10:05:12 +0000"  >&lt;p&gt;Landed for 2.2&lt;/p&gt;</comment>
                            <comment id="38343" author="bogl" created="Tue, 8 May 2012 17:12:07 +0000"  >&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/#change,2690&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,2690&lt;/a&gt;&lt;br/&gt;
back port to b2_1&lt;/p&gt;</comment>
                            <comment id="44009" author="nedbass" created="Thu, 30 Aug 2012 15:48:12 +0000"  >&lt;p&gt;We hit this assertion during testing after cherry-picking &lt;a href=&quot;http://review.whamcloud.com/#change,1955&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,1955&lt;/a&gt; into our 2.1.2 branch.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;LustreError: 3846:0:(vvp_page.c:167:vvp_page_unmap()) ASSERTION(PageLocked(vmpage)) failed
LustreError: 3846:0:(vvp_page.c:167:vvp_page_unmap()) LBUG

PID: 3846   TASK: ffff88054af26aa0  CPU: 3   COMMAND: &quot;ldlm_bl_10&quot;
 #0 [ffff880567895948] machine_kexec at ffffffff8103216b
 #1 [ffff8805678959a8] crash_kexec at ffffffff810b8d12
 #2 [ffff880567895a78] panic at ffffffff814ee999
 #3 [ffff880567895af8] lbug_with_loc at ffffffffa0515e1b [libcfs]
 #4 [ffff880567895b18] libcfs_assertion_failed at ffffffffa051f42d [libcfs]
 #5 [ffff880567895b38] vvp_page_unmap at ffffffffa0aebc8c [lustre]
 #6 [ffff880567895b68] cl_page_invoke at ffffffffa06982f8 [obdclass]
 #7 [ffff880567895ba8] cl_page_unmap at ffffffffa0698383 [obdclass]
 #8 [ffff880567895bb8] check_and_discard_cb at ffffffffa069f6be [obdclass]
 #9 [ffff880567895c08] cl_page_gang_lookup at ffffffffa069b763 [obdclass]
#10 [ffff880567895cb8] cl_lock_page_out at ffffffffa069ce3b [obdclass]
#11 [ffff880567895d28] osc_lock_flush at ffffffffa09c197f [osc]
#12 [ffff880567895d78] osc_lock_cancel at ffffffffa09c1a19 [osc]
#13 [ffff880567895dc8] cl_lock_cancel0 at ffffffffa069c085 [obdclass]
#14 [ffff880567895df8] cl_lock_cancel at ffffffffa069c8b3 [obdclass]
#15 [ffff880567895e18] osc_ldlm_blocking_ast at ffffffffa09c2673 [osc]
#16 [ffff880567895e88] ldlm_handle_bl_callback at ffffffffa07a7db4 [ptlrpc]
#17 [ffff880567895eb8] ldlm_bl_thread_main at ffffffffa07a8139 [ptlrpc]
#18 [ffff880567895f48] kernel_thread at ffffffff8100c14a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="44021" author="jay" created="Thu, 30 Aug 2012 19:40:57 +0000"  >&lt;p&gt;please apply patch at &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1059&quot; title=&quot;vvp_page_unmap()) ASSERTION(PageLocked(vmpage))&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1059&quot;&gt;&lt;del&gt;LU-1059&lt;/del&gt;&lt;/a&gt; &lt;/p&gt;</comment>
                            <comment id="44057" author="nedbass" created="Fri, 31 Aug 2012 16:16:16 +0000"  >&lt;p&gt;Thanks, that patch cleared up the vvp_page_unmap() assertion.  We&apos;re now testing recovery with this tag &lt;a href=&quot;https://github.com/chaos/lustre/commits/2.1.2-3chaos&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://github.com/chaos/lustre/commits/2.1.2-3chaos&lt;/a&gt; plus the following patches.&lt;/p&gt;

&lt;ul&gt;
	&lt;li&gt;c882f3a &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1059&quot; title=&quot;vvp_page_unmap()) ASSERTION(PageLocked(vmpage))&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1059&quot;&gt;&lt;del&gt;LU-1059&lt;/del&gt;&lt;/a&gt; clio: to not try to discard freeing pages&lt;/li&gt;
	&lt;li&gt;9286c90 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-948&quot; title=&quot;Client recovery hang&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-948&quot;&gt;&lt;del&gt;LU-948&lt;/del&gt;&lt;/a&gt; clio: add a callback to cl_page_gang_lookup()&lt;/li&gt;
	&lt;li&gt;82a8948 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1716&quot; title=&quot;Race in setting connection flags and using them on 2.x client connect&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1716&quot;&gt;&lt;del&gt;LU-1716&lt;/del&gt;&lt;/a&gt; ptlrpc: Race in updating of connection flags on client.&lt;/li&gt;
	&lt;li&gt;8812d32 &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1299&quot; title=&quot;running truncated executable causes spewing of lock debug messages&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1299&quot;&gt;&lt;del&gt;LU-1299&lt;/del&gt;&lt;/a&gt; clio: set the lock to CLS_NEW if unuse returns error&lt;/li&gt;
&lt;/ul&gt;


&lt;p&gt;Unfortunately I just found another client deadlocked in recovery with a similar stack trace to the description.  So I&apos;m afraid  &lt;a href=&quot;http://review.whamcloud.com/#change,1955&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,1955&lt;/a&gt; does not fix the problem.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;
crash&amp;gt; bt 6257
PID: 6257   TASK: ffff8808317ccaa0  CPU: 4   COMMAND: &quot;ptlrpcd-rcv&quot;
 #0 [ffff88083084b680] schedule at ffffffff814ef052
 #1 [ffff88083084b748] io_schedule at ffffffff814ef833
 #2 [ffff88083084b768] sync_page at ffffffff81110d5d
 #3 [ffff88083084b778] __wait_on_bit_lock at ffffffff814f009a
 #4 [ffff88083084b7c8] __lock_page at ffffffff81110cf7
 #5 [ffff88083084b828] vvp_page_own at ffffffffa09ce18a [lustre]
 #6 [ffff88083084b858] cl_page_own0 at ffffffffa05ace9b [obdclass]
 #7 [ffff88083084b8a8] cl_page_own at ffffffffa05ad070 [obdclass]
 #8 [ffff88083084b8b8] check_and_discard_cb at ffffffffa05b26af [obdclass]
 #9 [ffff88083084b908] cl_page_gang_lookup at ffffffffa05ae763 [obdclass]
#10 [ffff88083084b9b8] cl_lock_page_out at ffffffffa05afe3b [obdclass]
#11 [ffff88083084ba28] osc_lock_flush at ffffffffa08b697f [osc]
#12 [ffff88083084ba78] osc_lock_cancel at ffffffffa08b6a19 [osc]
#13 [ffff88083084bac8] cl_lock_cancel0 at ffffffffa05af085 [obdclass]
#14 [ffff88083084baf8] cl_lock_cancel at ffffffffa05af8b3 [obdclass]
#15 [ffff88083084bb18] osc_ldlm_blocking_ast at ffffffffa08b7673 [osc]
#16 [ffff88083084bb88] ldlm_cancel_callback at ffffffffa06a0083 [ptlrpc]
#17 [ffff88083084bba8] ldlm_lock_cancel at ffffffffa06a0165 [ptlrpc]
#18 [ffff88083084bbc8] ldlm_cli_cancel_list_local at ffffffffa06b7698 [ptlrpc]
#19 [ffff88083084bc28] ldlm_cancel_lru_local at ffffffffa06b7a95 [ptlrpc]
#20 [ffff88083084bc48] ldlm_replay_locks at ffffffffa06b7b9f [ptlrpc]
#21 [ffff88083084bcc8] ptlrpc_import_recovery_state_machine at ffffffffa06f5c26 [ptlrpc]
#22 [ffff88083084bd08] ptlrpc_connect_interpret at ffffffffa06f65bd [ptlrpc]
#23 [ffff88083084bda8] ptlrpc_check_set at ffffffffa06d0955 [ptlrpc]
#24 [ffff88083084be48] ptlrpcd_check at ffffffffa06f8ee0 [ptlrpc]
#25 [ffff88083084be78] ptlrpcd at ffffffffa06f91fb [ptlrpc]
#26 [ffff88083084bf48] kernel_thread at ffffffff8100c14a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="44187" author="jay" created="Wed, 5 Sep 2012 00:58:16 +0000"  >&lt;p&gt;Hi Ned, can you please show me the backtrace of other processes when this issue happened?&lt;/p&gt;</comment>
                            <comment id="46642" author="morrone" created="Tue, 16 Oct 2012 20:17:18 +0000"  >&lt;p&gt;Jinshan, here is a console log showing all backtraces on the system.  I&apos;m not entirely certain if this will be useful, because this node was a PPC64 box running the older 2.1.0-13chaos code.  2.1.0-13chaos did NOT have the  &lt;a href=&quot;http://review.whamcloud.com/1955&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/1955&lt;/a&gt; fix.&lt;/p&gt;

&lt;p&gt;But the backtrace is the same for ptlrpcd-rcv, and you can see some other processes with backtraces under lustre (&quot;cp&quot; looks like an interesting one).  I will attach seqlac2_console.txt.&lt;/p&gt;</comment>
                            <comment id="46643" author="morrone" created="Tue, 16 Oct 2012 20:18:09 +0000"  >&lt;p&gt;Attached seqlac2_console.txt showing backtraces of all processes on a PPC64 client.&lt;/p&gt;</comment>
                            <comment id="46824" author="jay" created="Sun, 21 Oct 2012 15:08:44 +0000"  >&lt;p&gt;Sorry for the delayed response. This must be a race between read-ahead pages and the DLM lock; I&apos;m looking at it.&lt;/p&gt;</comment>
                            <comment id="162057" author="simmonsja" created="Tue, 16 Aug 2016 16:37:15 +0000"  >&lt;p&gt;Old ticket for unsupported version&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="13089">LU-1066</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="13050">LU-1059</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="10693" name="hype320_bt_pages.txt.bz2" size="9502340" author="morrone" created="Tue, 20 Dec 2011 17:48:35 +0000"/>
                            <attachment id="11970" name="seqlac2_console.txt" size="831139" author="morrone" created="Tue, 16 Oct 2012 20:18:09 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10490" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>End date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Fri, 27 Jun 2014 17:39:39 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzv7k7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>4759</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10493" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>Start date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Tue, 20 Dec 2011 17:39:39 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    </customfields>
    </item>
</channel>
</rss>