<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:29:46 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-9843]  LNetError: 57600:0:(linux-cpu.c:572:cfs_cpt_spread_node()) LBUG</title>
                <link>https://jira.whamcloud.com/browse/LU-9843</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Client hit LBUG.&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;[1498857336.755629] LNetError: 57600:0:(linux-cpu.c:572:cfs_cpt_spread_node()) LBUG
[1498857336.779630] Pid: 57600, comm: lfs
[1498857336.779630] LNetError: 57594:0:(linux-cpu.c:572:cfs_cpt_spread_node()) LBUG
[1498857336.779630] LNetError: 57588:0:(linux-cpu.c:572:cfs_cpt_spread_node()) LBUG
[1498857336.779630] Pid: 57594, comm: lfs
[1498857336.779630] 
[1498857336.779630] Call Trace:
[1498857336.779630] Pid: 57588, comm: lfs
[1498857336.779630] 
[14988573 3 67.7 o7u96t 3o0]f 8Ca cllp usT rainc e:kd^Mb
, waiting &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; the &lt;span class=&quot;code-keyword&quot;&gt;rest&lt;/span&gt;, timeout in 10 second(s)
[1498857336.779630] [&amp;lt;ffffffff81004b35&amp;gt;] dump_trace+0x75/0x300
[1498857336.779630] [&amp;lt;ffffffff81004b35&amp;gt;] dump_trace+0x75/0x300
[1498857336.779630] [&amp;lt;ffffffffa09df82a&amp;gt;] libcfs_debug_dumpstack+0x4a/0x70 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09df82a&amp;gt;] libcfs_debug_dumpstack+0x4a/0x70 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09dfd5e&amp;gt;] lbug_with_loc+0x3e/0xb0 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09dfd5e&amp;gt;] lbug_with_loc+0x3e/0xb0 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e18a6&amp;gt;] cfs_cpt_spread_node+0xf6/0x130 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e18a6&amp;gt;] cfs_cpt_spread_node+0xf6/0x130 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e0488&amp;gt;] cfs_cpt_malloc+0x18/0x40 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e0488&amp;gt;] cfs_cpt_malloc+0x18/0x40 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa0d1d60b&amp;gt;] ptlrpc_prep_set+0x4b/0x310 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa0d1d60b&amp;gt;] ptlrpc_prep_set+0x4b/0x310 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa0d238ac&amp;gt;] ptlrpc_queue_wait+0x3c/0x220 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa0d238ac&amp;gt;] ptlrpc_queue_wait+0x3c/0x220 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa1086993&amp;gt;] osc_quotactl+0xf3/0x360 [osc]
[1498857336.779630] [&amp;lt;ffffffffa1086993&amp;gt;] osc_quotactl+0xf3/0x360 [osc]
[1498857336.779630] [&amp;lt;ffffffffa0ecb8ea&amp;gt;] lov_quotactl+0x38a/0x930 [lov]
[1498857336.779630] [&amp;lt;ffffffffa0ecb8ea&amp;gt;] lov_quotactl+0x38a/0x930 [lov]
[1498857336.779630] [&amp;lt;ffffffffa0f2f4d9&amp;gt;] obd_quotactl+0xb9/0x340 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f2f4d9&amp;gt;] obd_quotactl+0xb9/0x340 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f3552b&amp;gt;] quotactl_ioctl+0x100b/0x15b0 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f3552b&amp;gt;] quotactl_ioctl+0x100b/0x15b0 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f37a48&amp;gt;] ll_dir_ioctl+0x1908/0x62f0 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f37a48&amp;gt;] ll_dir_ioctl+0x1908/0x62f0 [lustre]
[1498857336.779630] [&amp;lt;ffffffff8117117b&amp;gt;] do_vfs_ioctl+0x8b/0x3b0
[1498857336.779630] [&amp;lt;ffffffff8117117b&amp;gt;] do_vfs_ioctl+0x8b/0x3b0
[1498857336.779630] [&amp;lt;ffffffff81171541&amp;gt;] sys_ioctl+0xa1/0xb0
[1498857336.779630] [&amp;lt;ffffffff81171541&amp;gt;] sys_ioctl+0xa1/0xb0
[1498857336.779630] [&amp;lt;ffffffff81483972&amp;gt;] system_call_fastpath+0x16/0x1b
[1498857336.779630] [&amp;lt;ffffffff81483972&amp;gt;] system_call_fastpath+0x16/0x1b
[1498857336.779630] [&amp;lt;00007fffed63f9a7&amp;gt;] 0x7fffed63f9a7
[1498857336.779630] [&amp;lt;00007fffed63f9a7&amp;gt;] 0x7fffed63f9a7
[1498857336.779630] 
[1498857336.779630] 
[1498857336.779630] Kernel panic - not syncing: LBUG
[1498857336.779630] Pid: 57594, comm: lfs Tainted: P ENX 3.0.101-100.1.20170523-nasa #1
[1498857336.779630] Call Trace:
[1498857336.779630] [&amp;lt;ffffffff81004b35&amp;gt;] dump_trace+0x75/0x300
[1498857336.779630] [&amp;lt;ffffffff814786b3&amp;gt;] dump_stack+0x69/0x6f
[1498857336.779630] [&amp;lt;ffffffff8147876f&amp;gt;] panic+0xb6/0x224
[1498857336.779630] [&amp;lt;ffffffffa09dfdc3&amp;gt;] lbug_with_loc+0xa3/0xb0 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e18a6&amp;gt;] cfs_cpt_spread_node+0xf6/0x130 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa09e0488&amp;gt;] cfs_cpt_malloc+0x18/0x40 [libcfs]
[1498857336.779630] [&amp;lt;ffffffffa0d1d60b&amp;gt;] ptlrpc_prep_set+0x4b/0x310 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa0d238ac&amp;gt;] ptlrpc_queue_wait+0x3c/0x220 [ptlrpc]
[1498857336.779630] [&amp;lt;ffffffffa1086993&amp;gt;] osc_quotactl+0xf3/0x360 [osc]
[1498857336.779630] [&amp;lt;ffffffffa0ecb8ea&amp;gt;] lov_quotactl+0x38a/0x930 [lov]
[1498857336.779630] [&amp;lt;ffffffffa0f2f4d9&amp;gt;] obd_quotactl+0xb9/0x340 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f3552b&amp;gt;] quotactl_ioctl+0x100b/0x15b0 [lustre]
[1498857336.779630] [&amp;lt;ffffffffa0f37a48&amp;gt;] ll_dir_ioctl+0x1908/0x62f0 [lustre]
[1498857336.779630] [&amp;lt;ffffffff8117117b&amp;gt;] do_vfs_ioctl+0x8b/0x3b0
[1498857336.779630] [&amp;lt;ffffffff81171541&amp;gt;] sys_ioctl+0xa1/0xb0
[1498857336.779630] [&amp;lt;ffffffff81483972&amp;gt;] system_call_fastpath+0x16/0x1b
[1498857336.779630] [&amp;lt;00007fffed63f9a7&amp;gt;] 0x7fffed63f9a7
All cpus are now in kdb
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>SLES11SP4 with lustre 2.7.3</environment>
        <key id="47692">LU-9843</key>
            <summary> LNetError: 57600:0:(linux-cpu.c:572:cfs_cpt_spread_node()) LBUG</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="sharmaso">Sonia Sharma</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Mon, 7 Aug 2017 21:31:26 +0000</created>
                <updated>Thu, 10 Oct 2019 21:35:18 +0000</updated>
                            <resolved>Thu, 10 Oct 2019 21:35:18 +0000</resolved>
                                    <version>Lustre 2.7.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="204806" author="pjones" created="Tue, 8 Aug 2017 17:38:26 +0000"  >&lt;p&gt;Sonia&lt;/p&gt;

&lt;p&gt;Can you please advise?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="204888" author="sharmaso" created="Wed, 9 Aug 2017 13:53:19 +0000"  >&lt;p&gt;Hi Mahmoud,&lt;br/&gt;
 Can we have access to vmcore and vmlinux for this?&lt;/p&gt;

&lt;p&gt;Thanks!&lt;/p&gt;</comment>
                            <comment id="204929" author="mhanafi" created="Wed, 9 Aug 2017 17:49:21 +0000"  >&lt;p&gt;Unfortunately we were not able to get a crash dump. Only other clue I have, I believe this occurred when one of the OST had hit a bitmap error and was remounted Read-only.&lt;/p&gt;</comment>
                            <comment id="204944" author="sharmaso" created="Wed, 9 Aug 2017 19:34:12 +0000"  >&lt;p&gt;Can you please give details on from where you got the build for&#160;SLES11SP4 with lustre 2.7.3 or did you build yourself?&lt;br/&gt;
 I could not find a branch with tag 2.7.3. Is it the tag in a fe branch?&#160;&lt;/p&gt;</comment>
                            <comment id="204947" author="pjones" created="Wed, 9 Aug 2017 19:58:44 +0000"  >&lt;p&gt;Sonia&lt;/p&gt;

&lt;p&gt;NASA have their own distribution based on the 2.7 FE branch. They will need to grant you access to it on github&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="204955" author="jaylan" created="Wed, 9 Aug 2017 20:38:57 +0000"  >&lt;p&gt;Hi Sonia,&lt;/p&gt;

&lt;p&gt;If you give me your login ID at github.com I can add you to the list with access permission to our FE git repo.&lt;/p&gt;</comment>
                            <comment id="204961" author="sharmaso" created="Wed, 9 Aug 2017 21:01:58 +0000"  >&lt;p&gt;Hi Jay&lt;br/&gt;
My login-id&#160;for github.com is &lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;mailto:soniash24@gmail.com&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;soniash24@gmail.com&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/mail_small.gif&quot; height=&quot;12&quot; width=&quot;13&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt;&#160;(username-Sonia241087)&lt;/p&gt;</comment>
                            <comment id="204965" author="jaylan" created="Wed, 9 Aug 2017 22:23:49 +0000"  >&lt;p&gt;Hi Sonia,&lt;br/&gt;
Have you received invitation from github to join &quot;NASA Earth Exchange (NEX)?&quot; The lustre FE (lustre-nas-fe) repo is housed under NEX. You will join as a member to Lustre team.&lt;/p&gt;</comment>
                            <comment id="204966" author="sharmaso" created="Wed, 9 Aug 2017 22:26:43 +0000"  >&lt;p&gt;Hi Jay&lt;br/&gt;
Yes I am able to access the repo. Thanks&lt;/p&gt;</comment>
                            <comment id="205156" author="sharmaso" created="Fri, 11 Aug 2017 16:01:21 +0000"  >&lt;p&gt;Can we get information on how&#160;many NUMA nodes and CPU cores are there? Also what is the value of&#160;MAX_NUMNODES (&#160;from /proc/self/status, field Mems_allowed)?&lt;/p&gt;</comment>
                            <comment id="205191" author="sharmaso" created="Fri, 11 Aug 2017 19:36:16 +0000"  >&lt;p&gt;Hi Mahmoud,&lt;/p&gt;

&lt;p&gt;Remounting of ost might have exposed a bug in the cfs_cpt_spread_node() code which is the reason it hit LBUG. Here is what happened we think - when ost was remounted, it called function ost_setup() which further called cfs_cpt_nodemask()&#160;and cfs_cpt_set_node() that might change&#160;the mask. This would then expose a race condition, where the mask changes after the rotor has been calculated but before the rotor is checked, causing the LBUG to be hit.&lt;br/&gt;
I will push a patch to branch b2_7_fe to&#160;fix this issue in the code. &lt;br/&gt;
Though, the 2.10 release has the fix and a series of many other patches related to CPT rework code. So it might be a good idea to update to the 2.10 release.&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;</comment>
                            <comment id="205658" author="mhanafi" created="Thu, 17 Aug 2017 18:41:29 +0000"  >&lt;p&gt;2.10 release is a longer term option. For now we will need a 2.7fe patch.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="205660" author="sharmaso" created="Thu, 17 Aug 2017 18:43:28 +0000"  >&lt;p&gt;I have pushed this patch but it still needs to be reviewed and landed.&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/28538&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/28538&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="206047" author="jaylan" created="Tue, 22 Aug 2017 19:04:33 +0000"  >&lt;p&gt;Hi Sonia, there were comments on #28538 from your reviewer. Should I ignore the comments and pick up your patchset #1?&lt;/p&gt;</comment>
                            <comment id="206049" author="sharmaso" created="Tue, 22 Aug 2017 19:09:24 +0000"  >&lt;p&gt;Hi Jay,&lt;/p&gt;

&lt;p&gt;I need to revise the patch but I was waiting for one more reviewer&apos;s (Dmitry&apos;s) feedback on the comments as he had done the major changes related to this fix on master.&#160;&lt;br/&gt;
I will revise it soon and upload a new patch which should anyways fix this particular issue.&lt;/p&gt;</comment>
                            <comment id="206051" author="pjones" created="Tue, 22 Aug 2017 19:13:40 +0000"  >&lt;p&gt;Sonia&lt;/p&gt;

&lt;p&gt;Dmitry is out of the office this week so I recommend refreshing with Amir&apos;s comments and then getting Dmitry&apos;s input upon his return&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="206053" author="sharmaso" created="Tue, 22 Aug 2017 19:21:46 +0000"  >&lt;p&gt;Sure. I refreshed the patch per Amir&apos;s comments.&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;</comment>
                            <comment id="206880" author="jaylan" created="Tue, 29 Aug 2017 21:11:40 +0000"  >&lt;p&gt;Does 2.10.0 need this patch? Thanks!&lt;/p&gt;</comment>
                            <comment id="206889" author="sharmaso" created="Tue, 29 Aug 2017 22:21:14 +0000"  >&lt;p&gt;2.10.0 doesn&apos;t need this patch as it had a series of patches related to cpt rework which already incorporated this fix.&lt;/p&gt;</comment>
                            <comment id="206985" author="jaylan" created="Wed, 30 Aug 2017 18:44:21 +0000"  >&lt;p&gt;Sorry I forgot to ask if the patch is needed for 2.9.0. We have lustre clients running 2.7.3, 2.9.0 and 2.10.0. Please advise. Thanks!&lt;/p&gt;</comment>
                            <comment id="207081" author="sharmaso" created="Thu, 31 Aug 2017 16:20:59 +0000"  >&lt;p&gt;Yes 2.9.0 would also require this patch.&lt;/p&gt;</comment>
                            <comment id="256204" author="mhanafi" created="Thu, 10 Oct 2019 21:28:27 +0000"  >&lt;p&gt;please close we are no longer running 2.7&lt;/p&gt;</comment>
                            <comment id="256205" author="pjones" created="Thu, 10 Oct 2019 21:35:18 +0000"  >&lt;p&gt;ok - thanks&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzi0f:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>