<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:10:57 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14578] LustreError: 25433:0:(tgt_grant.c:223:tgt_grant_sanity_check()) LBUG</title>
                <link>https://jira.whamcloud.com/browse/LU-14578</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This filesystem has 2 servers, and both hit an LBUG.&lt;/p&gt;

&lt;p&gt;First one&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
[4308300.501701] LustreError: 17867:0:(tgt_grant.c:463:tgt_grant_space_left()) nbp12-OST0000: cli 55a893a2-37fc-a91e-0edd-c13e39c0bcd7/ffff93b5024b4000 left 51980938248192 &amp;lt; tot_grant 4611686279107159457 unstable 85434368 pending 90030080 dirty 390602752
[4308300.568648] LustreError: 17867:0:(tgt_grant.c:463:tgt_grant_space_left()) Skipped 69 previous similar messages
[4308305.988484] LustreError: 80109:0:(tgt_grant.c:463:tgt_grant_space_left()) nbp12-OST0000: cli ba1ae12e-b75a-7684-bce5-34097cf4072c/ffff93b488caa400 left 51980913885184 &amp;lt; tot_grant 4611686277031540129 unstable 0 pending 0 dirty 344813568
[4308306.051765] LustreError: 80109:0:(tgt_grant.c:463:tgt_grant_space_left()) Skipped 44 previous similar messages
[4308314.057174] LustreError: 86494:0:(tgt_grant.c:463:tgt_grant_space_left()) nbp12-OST0000: cli b5875278-4309-10d6-2c2d-557864167838/ffff93a576975c00 left 51980868866048 &amp;lt; tot_grant 4611686246882669986 unstable 27496448 pending 31715328 dirty 373313536
[4308314.124119] LustreError: 86494:0:(tgt_grant.c:463:tgt_grant_space_left()) Skipped 38 previous similar messages
[4308330.021959] LustreError: 17949:0:(tgt_grant.c:463:tgt_grant_space_left()) nbp12-OST0000: cli fcefe8b5-bf4c-3d12-56f9-fb1b93134dfc/ffff939c3f41a800 left 51980592369664 &amp;lt; tot_grant 4611686224816031140 unstable 25616384 pending 25669632 dirty 388505600
[4308330.088908] LustreError: 17949:0:(tgt_grant.c:463:tgt_grant_space_left()) Skipped 183 previous similar messages
[4308337.687240] LustreError: 19209:0:(tgt_grant.c:151:tgt_check_export_grants()) nbp12-OST0000: cli 5fc11b40-37df-3838-564b-bfebf0abf25a/ffff93ad4aeb9000 ted_grant(4611686037896666112) + ted_pending(0) &amp;gt; maxsize(77690215612416)
[4308337.747390] LustreError: 19209:0:(tgt_grant.c:223:tgt_grant_sanity_check()) LBUG
[4308337.749201] LustreError: 25433:0:(tgt_grant.c:223:tgt_grant_sanity_check()) LBUG
[4308337.749203] Pid: 25433, comm: kworker/11:0 3.10.0-1127.19.1.el7_lustre2125.x86_64 #1 SMP Mon Nov 2 14:50:02 PST 2020
[4308337.749203] Call Trace:
[4308337.749221]&#160; [&amp;lt;ffffffffc09f67cc&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[4308337.749225]&#160; [&amp;lt;ffffffffc09f687c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[4308337.749275]&#160; [&amp;lt;ffffffffc135aa20&amp;gt;] tgt_grant_sanity_check+0x520/0x560 [ptlrpc]
[4308337.749281]&#160; [&amp;lt;ffffffffc18dccd8&amp;gt;] ofd_destroy_export+0x88/0x110 [ofd]
[4308337.749304]&#160; [&amp;lt;ffffffffc0e2459e&amp;gt;] class_export_destroy+0xee/0x490 [obdclass]
[4308337.749316]&#160; [&amp;lt;ffffffffc0e24955&amp;gt;] obd_zombie_exp_cull+0x15/0x20 [obdclass]
[4308337.749319]&#160; [&amp;lt;ffffffffa28be6bf&amp;gt;] process_one_work+0x17f/0x440
[4308337.749321]&#160; [&amp;lt;ffffffffa28bf7d6&amp;gt;] worker_thread+0x126/0x3c0
[4308337.749323]&#160; [&amp;lt;ffffffffa28c6691&amp;gt;] kthread+0xd1/0xe0
[4308337.749325]&#160; [&amp;lt;ffffffffa2f92d1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[4308337.749340]&#160; [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
[4308337.749341] Kernel panic - not syncing: LBUG
[4308337.749343] CPU: 11 PID: 25433 Comm: kworker/11:0 Kdump: loaded Tainted: G &#160; &#160; &#160; &#160; &#160; OE&#160; ------------ &#160; 3.10.0-1127.19.1.el7_lustre2125.x86_64 #1
[4308337.749343] Hardware name: HPE ProLiant DL380 Gen10/ProLiant DL380 Gen10, BIOS U30 06/15/2018
[4308337.749356] Workqueue: obd_zombid obd_zombie_exp_cull [obdclass]
[4308337.749356] Call Trace:
[4308337.749360]&#160; [&amp;lt;ffffffffa2f7ffa5&amp;gt;] dump_stack+0x19/0x1b
[4308337.749362]&#160; [&amp;lt;ffffffffa2f79541&amp;gt;] panic+0xe8/0x21f
[4308337.749367]&#160; [&amp;lt;ffffffffc09f68cb&amp;gt;] lbug_with_loc+0x9b/0xa0 [libcfs]
[4308337.749399]&#160; [&amp;lt;ffffffffc135aa20&amp;gt;] tgt_grant_sanity_check+0x520/0x560 [ptlrpc]
[4308337.749403]&#160; [&amp;lt;ffffffffc18dccd8&amp;gt;] ofd_destroy_export+0x88/0x110 [ofd]
[4308337.749416]&#160; [&amp;lt;ffffffffc0e2459e&amp;gt;] class_export_destroy+0xee/0x490 [obdclass]
[4308337.749428]&#160; [&amp;lt;ffffffffc0e24955&amp;gt;] obd_zombie_exp_cull+0x15/0x20 [obdclass]
[4308337.749430]&#160; [&amp;lt;ffffffffa28be6bf&amp;gt;] process_one_work+0x17f/0x440
[4308337.749431]&#160; [&amp;lt;ffffffffa28bf7d6&amp;gt;] worker_thread+0x126/0x3c0
[4308337.749433]&#160; [&amp;lt;ffffffffa28bf6b0&amp;gt;] ? manage_workers.isra.26+0x2a0/0x2a0
[4308337.749434]&#160; [&amp;lt;ffffffffa28c6691&amp;gt;] kthread+0xd1/0xe0
[4308337.749436]&#160; [&amp;lt;ffffffffa28c65c0&amp;gt;] ? insert_kthread_work+0x40/0x40
[4308337.749437]&#160; [&amp;lt;ffffffffa2f92d1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[4308337.749438]&#160; [&amp;lt;ffffffffa28c65c0&amp;gt;] ? insert_kthread_work+0x40/0x40
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Second one &lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
[3879290.271375] LustreError: 16716:0:(tgt_grant.c:463:tgt_grant_space_left()) nbp12-OST000b: cli ad8e8405-8dcc-dcec-4983-af2b3509ed40/ffff9a21dd688400 left 51431169011712 &amp;lt; tot_grant 4611686156105684284 unstable 0 pending 0 dirty 55066624
[3879290.334406] LustreError: 16716:0:(tgt_grant.c:463:tgt_grant_space_left()) Skipped 6 previous similar messages
[3879348.214404] LustreError: 87087:0:(tgt_grant.c:151:tgt_check_export_grants()) nbp12-OST000b: cli 5fc11b40-37df-3838-564b-bfebf0abf25a/ffff9a32405cac00 ted_grant(4611686037969102848) + ted_pending(0) &amp;gt; maxsize(77690215612416)
[3879348.274549] LustreError: 87087:0:(tgt_grant.c:223:tgt_grant_sanity_check()) LBUG
[3879348.297309] Pid: 87087, comm: kworker/17:3 3.10.0-1127.19.1.el7_lustre2125.x86_64 #1 SMP Mon Nov 2 14:50:02 PST 2020
[3879348.297314] Call Trace:
[3879348.297326]  [&amp;lt;ffffffffc0b447cc&amp;gt;] libcfs_call_trace+0x8c/0xc0 [libcfs]
[3879348.302057]  
[3879348.302061] [&amp;lt;ffffffffc0b4487c&amp;gt;] lbug_with_loc+0x4c/0xa0 [libcfs]
[3879348.302061]  
[3879348.302107] [&amp;lt;ffffffffc15d6a20&amp;gt;] tgt_grant_sanity_check+0x520/0x560 [ptlrpc]
[3879348.302113]  [&amp;lt;ffffffffc125ecd8&amp;gt;] ofd_destroy_export+0x88/0x110 [ofd]
[3879348.302133]  [&amp;lt;ffffffffc0f8f59e&amp;gt;] class_export_destroy+0xee/0x490 [obdclass]
[3879348.302145]  [&amp;lt;ffffffffc0f8f955&amp;gt;] obd_zombie_exp_cull+0x15/0x20 [obdclass]
[3879348.302149]  [&amp;lt;ffffffffaccbe6bf&amp;gt;] process_one_work+0x17f/0x440
[3879348.302150]  [&amp;lt;ffffffffaccbf7d6&amp;gt;] worker_thread+0x126/0x3c0
[3879348.302152]  [&amp;lt;ffffffffaccc6691&amp;gt;] kthread+0xd1/0xe0
[3879348.302154]  [&amp;lt;ffffffffad392d1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[3879348.302169]  [&amp;lt;ffffffffffffffff&amp;gt;] 0xffffffffffffffff
[3879348.302170] Kernel panic - not syncing: LBUG
[3879348.302172] CPU: 17 PID: 87087 Comm: kworker/17:3 Kdump: loaded Tainted: G           OE  ------------   3.10.0-1127.19.1.el7_lustre2125.x86_64 #1
[3879348.302172] Hardware name: HPE ProLiant DL380 Gen10/ProLiant DL380 Gen10, BIOS U30 06/15/2018
[3879348.302185] Workqueue: obd_zombid obd_zombie_exp_cull [obdclass]
[3879348.302185] Call Trace:
[3879348.302188]  [&amp;lt;ffffffffad37ffa5&amp;gt;] dump_stack+0x19/0x1b
[3879348.302190]  [&amp;lt;ffffffffad379541&amp;gt;] panic+0xe8/0x21f
[3879348.302196]  [&amp;lt;ffffffffc0b448cb&amp;gt;] lbug_with_loc+0x9b/0xa0 [libcfs]
[3879348.302227]  [&amp;lt;ffffffffc15d6a20&amp;gt;] tgt_grant_sanity_check+0x520/0x560 [ptlrpc]
[3879348.302231]  [&amp;lt;ffffffffc125ecd8&amp;gt;] ofd_destroy_export+0x88/0x110 [ofd]
[3879348.302243]  [&amp;lt;ffffffffc0f8f59e&amp;gt;] class_export_destroy+0xee/0x490 [obdclass]
[3879348.302255]  [&amp;lt;ffffffffc0f8f955&amp;gt;] obd_zombie_exp_cull+0x15/0x20 [obdclass]
[3879348.302257]  [&amp;lt;ffffffffaccbe6bf&amp;gt;] process_one_work+0x17f/0x440
[3879348.302258]  [&amp;lt;ffffffffaccbf7d6&amp;gt;] worker_thread+0x126/0x3c0
[3879348.302260]  [&amp;lt;ffffffffaccbf6b0&amp;gt;] ? manage_workers.isra.26+0x2a0/0x2a0
[3879348.302261]  [&amp;lt;ffffffffaccc6691&amp;gt;] kthread+0xd1/0xe0
[3879348.302263]  [&amp;lt;ffffffffaccc65c0&amp;gt;] ? insert_kthread_work+0x40/0x40
[3879348.302264]  [&amp;lt;ffffffffad392d1d&amp;gt;] ret_from_fork_nospec_begin+0x7/0x21
[3879348.302265]  [&amp;lt;ffffffffaccc65c0&amp;gt;] ? insert_kthread_work+0x40/0x40
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="63624">LU-14578</key>
            <summary>LustreError: 25433:0:(tgt_grant.c:223:tgt_grant_sanity_check()) LBUG</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="2">Won&apos;t Fix</resolution>
                                        <assignee username="tappro">Mikhail Pershin</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Thu, 1 Apr 2021 18:19:47 +0000</created>
                <updated>Thu, 29 Jun 2023 02:33:55 +0000</updated>
                            <resolved>Mon, 17 Jan 2022 11:39:13 +0000</resolved>
                                    <version>Lustre 2.12.5</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>6</watches>
                                                                            <comments>
                            <comment id="297586" author="pjones" created="Thu, 1 Apr 2021 18:25:37 +0000"  >&lt;p&gt;Mike&lt;/p&gt;

&lt;p&gt;I believe that you&apos;ve looked into some issues in this area recently. What do you advise here?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="297686" author="tappro" created="Fri, 2 Apr 2021 15:24:52 +0000"  >&lt;p&gt;It looks like grants overflowed at some point, causing &lt;tt&gt;tot_grant&lt;/tt&gt; to become too large. I will check known issues first.&lt;/p&gt;</comment>
                            <comment id="322896" author="tappro" created="Mon, 17 Jan 2022 11:39:13 +0000"  >&lt;p&gt;The problem should be solved in the latest 2.12 releases.&lt;/p&gt;</comment>
                            <comment id="376850" author="qian_wc" created="Thu, 29 Jun 2023 02:33:55 +0000"  >&lt;p&gt;+1 on master: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/93a6a37b-819c-44d2-b248-8fc24bc85404&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/93a6a37b-819c-44d2-b248-8fc24bc85404&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01r67:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>