<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:30:20 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16826] MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed</title>
                <link>https://jira.whamcloud.com/browse/LU-16826</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Full stack trace is:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[81891.829222] LustreError: 2384348:0:(osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed:
[81891.842752] LustreError: 2384348:0:(osd_handler.c:6260:osd_index_declare_ea_insert()) LBUG
[81891.851987] Pid: 2384348, comm: lfsck_namespace 4.18.0-305.10.2.x6.4.010.32.x86_64 #1 SMP Thu Apr 27 19:48:12 MDT 2023
[81891.863654] Call Trace TBD:
[81891.867456] [&amp;lt;0&amp;gt;] libcfs_call_trace+0x6f/0x90 [libcfs]
[81891.873549] [&amp;lt;0&amp;gt;] lbug_with_loc+0x43/0x80 [libcfs]
[81891.879328] [&amp;lt;0&amp;gt;] osd_index_declare_ea_insert+0x3d4/0x480 [osd_ldiskfs]
[81891.886923] [&amp;lt;0&amp;gt;] lod_sub_declare_insert+0xef/0x240 [lod]
[81891.893314] [&amp;lt;0&amp;gt;] lfsck_namespace_repair_dangling+0xe75/0x1370 [lfsck]
[81891.900770] [&amp;lt;0&amp;gt;] lfsck_namespace_assistant_handler_p1+0x13b1/0x2020 [lfsck]
[81891.908732] [&amp;lt;0&amp;gt;] lfsck_assistant_engine+0x359/0x1c20 [lfsck]
[81891.915378] [&amp;lt;0&amp;gt;] kthread+0x116/0x130
[81891.919931] [&amp;lt;0&amp;gt;] ret_from_fork+0x1f/0x40
[81891.924807] Kernel panic - not syncing: LBUG
[81891.929939] CPU: 24 PID: 2384348 Comm: lfsck_namespace Kdump: loaded Tainted: G           OE    --------- -  - 4.18.0-305.10.2.x6.4.010.32.x86_64 #1
[81891.944936] Hardware name: Viking Enterprise Solutions VSSEP1EC/VSSEP1EC, BIOS RWH3LJ-10.07.00 08/29/2022
[81891.955347] Call Trace:
[81891.958645]  dump_stack+0x5c/0x80
[81891.962787]  panic+0xe7/0x2a9
[81891.966564]  ? ret_from_fork+0x1f/0x40
[81891.971112]  lbug_with_loc.cold.10+0x18/0x18 [libcfs]
[81891.976956]  osd_index_declare_ea_insert+0x3d4/0x480 [osd_ldiskfs]
[81891.983914]  ? osd_index_declare_ea_delete+0x1cd/0x2f0 [osd_ldiskfs]
[81891.991040]  lod_sub_declare_insert+0xef/0x240 [lod]
[81891.996762]  lfsck_namespace_repair_dangling+0xe75/0x1370 [lfsck]
[81892.003700]  ? dt_lookup_dir+0x80/0x190 [obdclass]
[81892.009229]  lfsck_namespace_assistant_handler_p1+0x13b1/0x2020 [lfsck]
[81892.016561]  ? __schedule+0x2cc/0x700
[81892.020938]  lfsck_assistant_engine+0x359/0x1c20 [lfsck]
[81892.026945]  ? __switch_to+0x10c/0x480
[81892.031371]  ? __schedule+0x2cc/0x700
[81892.035689]  ? finish_wait+0x80/0x80
[81892.039917]  ? lfsck_master_engine+0xcd0/0xcd0 [lfsck]
[81892.045680]  kthread+0x116/0x130
[81892.049530]  ? kthread_flush_work_fn+0x10/0x10
[81892.054580]  ret_from_fork+0x1f/0x40 &lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="76035">LU-16826</key>
            <summary>MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="zam">Alexander Zarochentsev</assignee>
                                    <reporter username="zam">Alexander Zarochentsev</reporter>
                        <labels>
                    </labels>
                <created>Fri, 12 May 2023 14:34:24 +0000</created>
                <updated>Sat, 23 Dec 2023 01:10:58 +0000</updated>
                            <resolved>Wed, 20 Dec 2023 02:30:22 +0000</resolved>
                                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="372125" author="zam" created="Fri, 12 May 2023 14:41:07 +0000"  >
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
lfsck_namespace_repair_dangling(...):
...
        &lt;span class=&quot;code-comment&quot;&gt;/* 7a. &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; child is remote, delete and insert to generate local agent */&lt;/span&gt;
        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (dt_object_remote(child)) {
                rc = dt_declare_delete(env, parent,
                                       (&lt;span class=&quot;code-keyword&quot;&gt;const&lt;/span&gt; struct dt_key *)lnr-&amp;gt;lnr_name,
                                       th);
                &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc)
                        GOTO(stop, rc);

===&amp;gt;        rc = dt_declare_insert(env, parent, (&lt;span class=&quot;code-keyword&quot;&gt;const&lt;/span&gt; struct dt_rec *)rec,
                                       (&lt;span class=&quot;code-keyword&quot;&gt;const&lt;/span&gt; struct dt_key *)lnr-&amp;gt;lnr_name,
                                       th);
                &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc)
                        GOTO(stop, rc);
        }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Looks like the 7a code path was never called (or the crash has not been reported yet): it misses the rec-&amp;gt;rec_fid initialisation before calling dt_declare_insert(), which causes an assertion failure in &lt;br/&gt;
osd_index_declare_ea_insert().&lt;/p&gt;</comment>
                            <comment id="372127" author="gerrit" created="Fri, 12 May 2023 14:44:24 +0000"  >&lt;p&gt;&quot;Alexander Zarochentsev &amp;lt;alexander.zarochentsev@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50980&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50980&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16826&quot; title=&quot;MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16826&quot;&gt;&lt;del&gt;LU-16826&lt;/del&gt;&lt;/a&gt; lfsck: init rec_fid before declare_insert&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 5dd21e56cbd9a695bf5444218bdec7206c346afe&lt;/p&gt;</comment>
                            <comment id="372241" author="zam" created="Sun, 14 May 2023 18:48:32 +0000"  >&lt;p&gt;Reproducer:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
MDSCOUNT=2 sh llmount.sh 

../utils/lfs mkdir -i 0 /mnt/lustre/mdt0dir
../utils/lfs mkdir -i 1 /mnt/lustre/mdt1dir

touch /mnt/lustre/mdt0dir/foo
mv /mnt/lustre/mdt0dir/foo /mnt/lustre/mdt1dir/
FOOFID=$(../utils/lfs path2fid /mnt/lustre/mdt1dir/foo | sed -E &lt;span class=&quot;code-quote&quot;&gt;&apos;s/^.(.*).$/\1/&apos;&lt;/span&gt;)
echo $FOOFID 

sync
umount /mnt/lustre-mds1
umount /mnt/lustre-mds2

echo &lt;span class=&quot;code-quote&quot;&gt;&quot;rm /REMOTE_PARENT_DIR/$FOOFID&quot;&lt;/span&gt; | debugfs -w /dev/mapper/mds1_flakey 

mount -t lustre /dev/mapper/mds1_flakey /mnt/lustre-mds1/
mount -t lustre /dev/mapper/mds2_flakey /mnt/lustre-mds2/

../utils/lctl lfsck_start -M lustre-MDT0000 -C
../utils/lctl lfsck_start -M lustre-MDT0001 -C

&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="372326" author="gerrit" created="Mon, 15 May 2023 17:53:21 +0000"  >&lt;p&gt;&quot;Alexander Zarochentsev &amp;lt;alexander.zarochentsev@hpe.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50998&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50998&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16826&quot; title=&quot;MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16826&quot;&gt;&lt;del&gt;LU-16826&lt;/del&gt;&lt;/a&gt; tests: lfsck to repair a dangling remote entry&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: afbf69ada658ca63c7a5953f3de12beb49d3a62b&lt;/p&gt;</comment>
                            <comment id="374013" author="gerrit" created="Wed, 31 May 2023 19:04:05 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50980/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50980/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16826&quot; title=&quot;MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16826&quot;&gt;&lt;del&gt;LU-16826&lt;/del&gt;&lt;/a&gt; lfsck: init rec_fid before declare_insert&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 02ac821653a0b2d897442e276d0afc31755064a4&lt;/p&gt;</comment>
                            <comment id="397527" author="gerrit" created="Wed, 20 Dec 2023 01:43:56 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/50998/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/50998/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16826&quot; title=&quot;MDS nodes panicked running lfsck repair create lost objects: (osd_handler.c:6260:osd_index_declare_ea_insert()) ASSERTION( fid != ((void *)0) ) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16826&quot;&gt;&lt;del&gt;LU-16826&lt;/del&gt;&lt;/a&gt; tests: lfsck to repair a dangling remote entry&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 07e02a600e5707de30e1441ce56b68b0cbc3c260&lt;/p&gt;</comment>
                            <comment id="397560" author="pjones" created="Wed, 20 Dec 2023 02:30:22 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="79700">LU-17385</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i03laf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>