<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:15:57 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-8255] LustreError: 38237:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x20007200e:0x90d8:0x0] error: rc = -71</title>
                <link>https://jira.whamcloud.com/browse/LU-8255</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>
&lt;p&gt;For one particular user, we are getting lots of these errors on the clients.&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;Jun  9 15:23:12 r221i4s0 kernel: [1465510992.386829] LustreError: 11-0: nbp6-MDT0000-mdc-ffff8803058bb000: operation ldlm_enqueue to node 10.151.26.79@o2ib failed: rc = -71
Jun  9 15:23:12 r221i4s0 kernel: [1465510992.398829] LustreError: Skipped 5 previous similar messages
Jun  9 15:23:12 r221i4s0 kernel: [1465510992.406829] LustreError: 74346:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x200071fef:0x1fd19:0x0] error: rc = -71
Jun  9 15:23:12 r221i4s0 kernel: [1465510992.406829] LustreError: 74346:0:(file.c:3165:ll_inode_revalidate_fini()) Skipped 5 previous similar messages
Jun  9 15:23:13 r154i0n0 kernel: [1465510993.479567] LustreError: 11-0: nbp6-MDT0000-mdc-ffff880302239800: operation ldlm_enqueue to node 10.151.26.79@o2ib failed: rc = -71
Jun  9 15:23:13 r154i0n0 kernel: [1465510993.491567] LustreError: Skipped 2 previous similar messages
Jun  9 15:23:13 r154i0n0 kernel: [1465510993.495567] LustreError: 68877:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x200072005:0x11ea5:0x0] error: rc = -71
Jun  9 15:23:13 r154i0n0 kernel: [1465510993.495567] LustreError: 68877:0:(file.c:3165:ll_inode_revalidate_fini()) Skipped 2 previous similar messages
Jun  9 15:23:16 r221i3n1 kernel: [1465510996.818948] LustreError: 11-0: nbp6-MDT0000-mdc-ffff880302157000: operation ldlm_enqueue to node 10.151.26.79@o2ib failed: rc = -71
Jun  9 15:23:16 r221i3n1 kernel: [1465510996.830948] LustreError: 68219:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x200071ef9:0x1dfce:0x0] er
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I will upload the MDS-side debug log to the FTP site.&lt;/p&gt;

</description>
                <environment>Client is running lustre 2.7.1 &lt;br/&gt;
Server is running lustre 2.5.3</environment>
        <key id="37517">LU-8255</key>
            <summary>LustreError: 38237:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x20007200e:0x90d8:0x0] error: rc = -71</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="4">Incomplete</resolution>
                                        <assignee username="yong.fan">nasf</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Thu, 9 Jun 2016 22:44:38 +0000</created>
                <updated>Thu, 29 Jun 2017 13:11:28 +0000</updated>
                            <resolved>Thu, 29 Jun 2017 13:11:28 +0000</resolved>
                                    <version>Lustre 2.7.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="155309" author="mhanafi" created="Thu, 9 Jun 2016 22:45:22 +0000"  >&lt;p&gt;uploaded logs to /uploads/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8255&quot; title=&quot;LustreError: 38237:0:(file.c:3165:ll_inode_revalidate_fini()) nbp6: revalidate FID [0x20007200e:0x90d8:0x0] error: rc = -71&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8255&quot;&gt;&lt;del&gt;LU-8255&lt;/del&gt;&lt;/a&gt;/mds.debugout.gz&lt;/p&gt;</comment>
                            <comment id="155322" author="mhanafi" created="Thu, 9 Jun 2016 23:52:50 +0000"  >&lt;p&gt;Looks like the user&apos;s job is creating and deleting lots of files and directories. &lt;/p&gt;</comment>
                            <comment id="155400" author="pjones" created="Fri, 10 Jun 2016 17:25:47 +0000"  >&lt;p&gt;Fan Yong&lt;/p&gt;

&lt;p&gt;Could you please advise?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="155448" author="yong.fan" created="Sun, 12 Jun 2016 06:17:26 +0000"  >&lt;p&gt;The log is quite large (1.2 GB), but it only contains some Lustre-level debug messages like the following:&lt;/p&gt;

&lt;blockquote&gt;
&lt;p&gt;...&lt;br/&gt;
00010000:00010000:1.0:1465510946.072747:0:39779:0:(ldlm_lockd.c:1181:ldlm_handle_enqueue0()) ### server-side enqueue handler START&lt;br/&gt;
00010000:00010000:1.0:1465510946.072750:0:39779:0:(ldlm_lockd.c:1269:ldlm_handle_enqueue0()) ### server-side enqueue handler, new lock created ns: mdt-nbp6-MDT0000_UUID lock: ffff88031d104740/0xbbcac3f0ff4e9f58 lrc: 2/0,0 mode: --/CR res: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x20007200f:0xbad7:0x0&amp;#93;&lt;/span&gt;.0 bits 0x0 rrc: 1 type: IBT flags: 0x40000000000000 nid: local remote: 0x3afc5dc70a36e37f expref: -99 pid: 39779 timeout: 0 lvb_type: 0&lt;br/&gt;
00010000:00010000:1.0:1465510946.072766:0:39779:0:(ldlm_lockd.c:1407:ldlm_handle_enqueue0()) ### server-side enqueue handler, sending reply(err=0, rc=-71) ns: mdt-nbp6-MDT0000_UUID lock: ffff88031d104740/0xbbcac3f0ff4e9f58 lrc: 1/0,0 mode: --/CR res: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x20007200f:0xbad7:0x0&amp;#93;&lt;/span&gt;.0 bits 0x2 rrc: 1 type: IBT flags: 0x44000000000000 nid: 10.151.40.7@o2ib remote: 0x3afc5dc70a36e37f expref: 10810 pid: 39779 timeout: 0 lvb_type: 0&lt;br/&gt;
00010000:00010000:1.0:1465510946.072771:0:39779:0:(ldlm_lock.c:219:ldlm_lock_put()) ### final lock_put on destroyed lock, freeing it. ns: mdt-nbp6-MDT0000_UUID lock: ffff88031d104740/0xbbcac3f0ff4e9f58 lrc: 0/0,0 mode: --/CR res: &lt;span class=&quot;error&quot;&gt;&amp;#91;0x20007200f:0xbad7:0x0&amp;#93;&lt;/span&gt;.0 bits 0x2 rrc: 1 type: IBT flags: 0x44000000000000 nid: 10.151.40.7@o2ib remote: 0x3afc5dc70a36e37f expref: 10810 pid: 39779 timeout: 0 lvb_type: 0&lt;br/&gt;
00010000:00010000:1.0:1465510946.072775:0:39779:0:(ldlm_lockd.c:1450:ldlm_handle_enqueue0()) ### server-side enqueue handler END (lock ffff88031d104740, rc -71)&lt;br/&gt;
00000100:00100000:1.0:1465510946.072787:0:39779:0:(service.c:2074:ptlrpc_server_handle_request()) Handled RPC pname:cluuid+ref:pid:xid:nid:opc mdt00_091:f83705d3-c797-c136-06e3-a15eff96d960+10809:46841:x1535100545951340:12345-10.151.40.7@o2ib:101 Request procesed in 45us (78us total) trans 0 rc -71/-71&lt;br/&gt;
...&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;That means the server returned a protocol error when handling the ldlm enqueue RPC from the client. But without detailed logs, we cannot point out exactly what is wrong. I have tried to simulate the interoperability trouble (client b2_7, server b2_5) locally, but could not reproduce it. So please enable -1 level debug logging on both the client and the MDS for a short time and try the failed operation again; then please collect the Lustre debug logs on both the client and the MDS, and attach them to this Jira ticket directly.&lt;/p&gt;

&lt;p&gt;Thanks!&lt;/p&gt;

&lt;p&gt;(Note: to keep the debug logs small, please run &quot;lctl clear&quot; on both the client and the MDS before the new attempt.)&lt;/p&gt;</comment>
                            <comment id="158792" author="yong.fan" created="Thu, 14 Jul 2016 10:14:22 +0000"  >&lt;p&gt;Any feedback? Thanks!&lt;/p&gt;</comment>
                            <comment id="200577" author="mhanafi" created="Thu, 29 Jun 2017 13:08:18 +0000"  >&lt;p&gt;We can close this case&lt;/p&gt;</comment>
                            <comment id="200582" author="pjones" created="Thu, 29 Jun 2017 13:11:28 +0000"  >&lt;p&gt;ok Mahmoud&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzyeaf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>