<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:11:09 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14600] sanity-lfsck test_30: f0 is not recovered</title>
                <link>https://jira.whamcloud.com/browse/LU-14600</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Andreas Dilger  &amp;lt;adilger@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/84000ede-1df1-4f8f-90a0-44f5afc1ea05&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/84000ede-1df1-4f8f-90a0-44f5afc1ea05&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_30 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;stat: cannot stat &apos;/mnt/lustre/d30.sanity-lfsck/foo/f0&apos;: No such file or directory
(18) f0 is not recovered
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This only started failing on 2021-04-08, so is very likely a regression due to a recent landing. &lt;/p&gt;





&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
sanity-lfsck test_30 - (18) f0 is not recovered&lt;/p&gt;</description>
                <environment></environment>
        <key id="63725">LU-14600</key>
            <summary>sanity-lfsck test_30: f0 is not recovered</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="adilger">Andreas Dilger</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Fri, 9 Apr 2021 15:28:31 +0000</created>
                <updated>Fri, 16 Apr 2021 23:40:16 +0000</updated>
                            <resolved>Fri, 16 Apr 2021 07:02:28 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="298388" author="adilger" created="Fri, 9 Apr 2021 15:42:57 +0000"  >&lt;p&gt;What is very strange is that this failure started happening on several different branches on the same day - master, b2_12, b_es5_2, and b_es6_0, which makes it unlikely (though not impossible) to be caused by the same patch landing on all four branches at once. &lt;/p&gt;

&lt;p&gt;&lt;del&gt;Testing on 2021-04-09 looks like it has started passing again&lt;/del&gt;, so it is &lt;em&gt;possible&lt;/em&gt; it was some kind of date-related bug (unlikely, but it happened with &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-13314&quot; title=&quot;sanity test_56ob: lfs find /mnt/lustre/d56ob.sanity -mtime 1y&amp;#39; wrong: found 0, expected 1&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-13314&quot;&gt;&lt;del&gt;LU-13314&lt;/del&gt;&lt;/a&gt;), or a strange hiccup in the test environment that only caused this particular test to fail that day?&lt;/p&gt;</comment>
                            <comment id="298508" author="arshad512" created="Mon, 12 Apr 2021 04:31:37 +0000"  >&lt;p&gt;Seen on master. &lt;a href=&quot;https://testing.whamcloud.com/test_sets/6fd26096-1e3c-4fbc-8685-d79e6f682975&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/6fd26096-1e3c-4fbc-8685-d79e6f682975&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="298630" author="eaujames" created="Tue, 13 Apr 2021 07:12:21 +0000"  >&lt;p&gt;Seen on b2_12:&#160; &lt;a href=&quot;https://testing.whamcloud.com/test_sessions/0b38adbc-8f78-4b49-8163-19007be5e8c7&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sessions/0b38adbc-8f78-4b49-8163-19007be5e8c7&lt;/a&gt;&lt;font color=&quot;#2e3436&quot;&gt;&#160;&lt;/font&gt;&lt;br/&gt;
&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160;&#160; &lt;a href=&quot;https://testing.whamcloud.com/test_sessions/eb8ea52e-1afe-4364-956f-1d424be88c97&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sessions/eb8ea52e-1afe-4364-956f-1d424be88c97&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="298807" author="adilger" created="Wed, 14 Apr 2021 20:07:45 +0000"  >&lt;p&gt;This test only started failing on 2021-04-08, and this is now a 100% failure for &lt;tt&gt;review-dne-part-2&lt;/tt&gt; and &lt;tt&gt;full&lt;/tt&gt; sessions for both master and b2_12 (the &lt;tt&gt;review-dne-zfs-part-2&lt;/tt&gt; sessions are passing because this test is ldiskfs-only).&lt;/p&gt;

&lt;p&gt;There were several patches landed to b2_12 on 2021-04-06:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;f735003c0f LU-14355 ptlrpc: do not output error when imp_sec is freed
0596a16841 LU-12506 changelog: support large number of MDT
7f04890a1b LU-13609 mgs: fix config_log buffer handling
0850c7b14a LU-13649 mdd: orhpan cleanup fix
5610ef9a7a LU-1538 tests: standardize test script init - sanity
7531c5d25c LU-14450 kernel: kernel update RHEL8.3 [4.18.0-240.15.1.el8_3]
2fd278af4c LU-11518 ldlm: lru code cleanup
eaee7c3cd6 LU-11518 osc: cancel osc_lock list traversal once found the lock is being used 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;Patches landed to master on 2021-04-06 are:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;622e4c6e04 LU-14547 test: skip sanityn 109 for local setup
14a1102268 LU-14552 ptlrpc: NULL pointer dereference in ptlrpc_watchdog_fire
f9d837b479 LU-14540 o2iblnd: Use REMOTE_DROPPED for ECONNREFUSED
3f8a6fd7d6 LU-14538 gss: make namespace optional in lgss_keyring
9cc7128b9b LU-14522 ldlm: reprocess locks if enqueue failed
1d3c585194 LU-14487 lustre: remove references to Sun Trademark.
642682a39e LU-14450 kernel: kernel update RHEL8.3 [4.18.0-240.15.1.el8_3]
f37bce8a57 LU-14119 osd: add mount option &quot;resetoi&quot;
99d00b97ef LU-14119 osd: delete stale OI mapping entry
f5136e8195 LU-14119 osd-zfs: enable LUDA_VERIFY
bf47526261 LU-14119 mdc: set fid2path RPC interruptible
771308ada3 LU-14291 ptlrpc: format UPDATE messages in server-only code
67d17dd590 LU-14195 libcfs: switch to kfree_sensitive
d7249d9d70 LU-13783 libcfs: provide fallback kallsyms_lookup_name()
3d101645a5 LU-14132 lod: do not initialize sub llogs twice
00141b1a74 LU-11776 utils: add support lfs find with mdt hash flag
4126fbb30c LU-13397 lfs: mirror resync to keep sparseness
77f5bb4dac LU-6142 lustre: convert IFTODT to S_DT
f38f09e02a LU-14090 mgs: no local logs flag
2a34dc95bd LU-12142 clio: fix hang on urgent cached pages
1058867c00 LU-12142 readahead: limit over reservation
b4391fcdaf LU-10632 tests: recovery-small test_26 idle_timeout
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;so the only common patch between these two branches is the &lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14450&quot; title=&quot;kernel update [RHEL8.3 4.18.0-240.15.1.el8_3]&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14450&quot;&gt;&lt;del&gt;LU-14450&lt;/del&gt;&lt;/a&gt; kernel: kernel update RHEL8.3 &lt;span class=&quot;error&quot;&gt;&amp;#91;4.18.0-240.15.1.el8_3&amp;#93;&lt;/span&gt;&lt;/tt&gt; patch (update from kernel 4.18.0-240.1.1.el8), but that is only affecting the &lt;b&gt;client&lt;/b&gt; for b2_12 testing.&lt;/p&gt;

&lt;p&gt;Comparing the test environment for the last passing and first failing run on b2_12 shows the server kernel version is different:&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;https://testing.whamcloud.com/test_sessions/b4203201-088d-47c8-87be-e08ef8e31cf1|2021-04-07 05:11:32&amp;#93;&lt;/span&gt;: pass Kernel version	3.10.0-1160.15.2.el7_lustre.x86_64&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;https://testing.whamcloud.com/test_sessions/bb45aa98-1c36-492d-a0f6-4b61135fae40|2021-04-09 22:57:14&amp;#93;&lt;/span&gt;: fail Kernel version	3.10.0-1160.21.1.el7_lustre.x86_64&lt;/p&gt;

&lt;p&gt;However, on master, both the passing and failing runs are using the same RHEL8 kernel on the servers:&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;https://testing.whamcloud.com/test_sessions/e72881e6-7c88-4fe3-888c-a431d2ad5810|2021-04-08 04:23:19&amp;#93;&lt;/span&gt;: pass Kernel version	4.18.0-240.15.1.el8_lustre.x86_64&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;https://testing.whamcloud.com/test_sessions/94bf8f9f-b129-46aa-bdde-8405a3216f63|2021-04-08 11:00:47&amp;#93;&lt;/span&gt;: fail Kernel version	4.18.0-240.15.1.el8_lustre.x86_64&lt;/p&gt;

&lt;p&gt;so it looks like this is caused somehow by a test environment change that happened on 2021-04-08 between 04:23-11:00.&lt;/p&gt;</comment>
                            <comment id="298809" author="adilger" created="Wed, 14 Apr 2021 20:30:37 +0000"  >&lt;p&gt;The only other common element among the test sessions is e2fsprogs, and it appears that the landing of patch &lt;a href=&quot;https://review.whamcloud.com/43169&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43169&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11446&quot; title=&quot;ldiskfs inodes nlink mismatch with DNE&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11446&quot;&gt;LU-11446&lt;/a&gt; e2fsck: check trusted.link when fixing nlink&lt;/tt&gt;&quot; has caused this test to start failing.&lt;/p&gt;

&lt;p&gt;The passing sessions are reporting e2fsprogs with &quot;&lt;tt&gt;e2fsck 1.45.6.wc5 (09-Feb-2021)&lt;/tt&gt;&quot; and failing ones report &quot;&lt;tt&gt;e2fsck 1.45.6.wc6 (09-Apr-2021)&lt;/tt&gt;&quot;.&lt;/p&gt;

&lt;p&gt;Reading the test description for &lt;tt&gt;sanity-lfsck.sh::test_30()&lt;/tt&gt; makes it clear that this is the cause, because the fix to &lt;tt&gt;e2fsck&lt;/tt&gt; is specifically to &lt;b&gt;avoid&lt;/b&gt; the entry being moved to &lt;tt&gt;lost+found&lt;/tt&gt;:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Inject failure stub on MDT0 to simulate the case that
directory d0 has no linkEA entry, then the LFSCK will
move it into .lustre/lost+found/MDTxxxx/ later.
:
 Pass 4: Checking reference counts
-Unattached inode 183
-Connect to /lost+found? yes
-
-Inode 183 ref count is 2, should be 1.  Fix? yes
-
 Unattached inode 187
 Connect to /lost+found? yes
 
 Inode 187 ref count is 2, should be 1.  Fix? yes

-Unattached inode 192
-Connect to /lost+found? yes
-
-Inode 192 ref count is 2, should be 1.  Fix? yes
-
-Unattached inode 193
-Connect to /lost+found? yes
-
-Inode 193 ref count is 2, should be 1.  Fix? yes
-
 Unattached inode 199
 Connect to /lost+found? yes
 
 Inode 199 ref count is 2, should be 1.  Fix? yes
 
 Inode 20106 ref count is 1, should be 2.  Fix? yes
 
 Inode 20108 ref count is 3, should be 2.  Fix? yes
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="298828" author="adilger" created="Thu, 15 Apr 2021 02:45:04 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/43324&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43324&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14600&quot; title=&quot;sanity-lfsck test_30: f0 is not recovered&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14600&quot;&gt;&lt;del&gt;LU-14600&lt;/del&gt;&lt;/a&gt; e2fsck: check trusted.link after linking inode&lt;br/&gt;
Project: tools/e2fsprogs&lt;br/&gt;
Branch: master-lustre&lt;br/&gt;
Current Patch Set: 2&lt;br/&gt;
Commit: b83f196e93f3cb982f720aeced810cbf650cde04&lt;/p&gt;</comment>
                            <comment id="298847" author="gerrit" created="Thu, 15 Apr 2021 08:29:55 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/43324/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43324/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14600&quot; title=&quot;sanity-lfsck test_30: f0 is not recovered&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14600&quot;&gt;&lt;del&gt;LU-14600&lt;/del&gt;&lt;/a&gt; e2fsck: check trusted.link after linking inode&lt;br/&gt;
Project: tools/e2fsprogs&lt;br/&gt;
Branch: master-lustre&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 87164b117be3bdeb1becf1960b80687637eda08f&lt;/p&gt;</comment>
                            <comment id="298924" author="adilger" created="Thu, 15 Apr 2021 18:29:34 +0000"  >&lt;p&gt;This patch appears to have fixed the problem - all four review-dne-part-2 sanity-lfsck runs started after 4am MT have passed. &lt;/p&gt;

&lt;p&gt;What is still needed here is an e2fsck test case for this - unreferenced inodes with xattrs that need to be relinked to lost+found. &lt;/p&gt;</comment>
                            <comment id="298952" author="gerrit" created="Thu, 15 Apr 2021 23:55:29 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/43335&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43335&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14600&quot; title=&quot;sanity-lfsck test_30: f0 is not recovered&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14600&quot;&gt;&lt;del&gt;LU-14600&lt;/del&gt;&lt;/a&gt; e2fsck: trusted.link unref inode test case&lt;br/&gt;
Project: tools/e2fsprogs&lt;br/&gt;
Branch: master-lustre&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: e12d23d0241a1d09e05c1ef129f201c8c1515ffa&lt;/p&gt;</comment>
                            <comment id="298972" author="gerrit" created="Fri, 16 Apr 2021 06:36:46 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/43335/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43335/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14600&quot; title=&quot;sanity-lfsck test_30: f0 is not recovered&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14600&quot;&gt;&lt;del&gt;LU-14600&lt;/del&gt;&lt;/a&gt; e2fsck: trusted.link unref inode test case&lt;br/&gt;
Project: tools/e2fsprogs&lt;br/&gt;
Branch: master-lustre&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: f46cb5c041147772639c56d993a4313e2655399d&lt;/p&gt;</comment>
                            <comment id="298974" author="adilger" created="Fri, 16 Apr 2021 07:02:00 +0000"  >&lt;p&gt;Fixed in 1.45.6.wc7&lt;/p&gt;</comment>
                            <comment id="299075" author="gerrit" created="Fri, 16 Apr 2021 23:40:16 +0000"  >&lt;p&gt;Andreas Dilger (adilger@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/43352&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/43352&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14600&quot; title=&quot;sanity-lfsck test_30: f0 is not recovered&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14600&quot;&gt;&lt;del&gt;LU-14600&lt;/del&gt;&lt;/a&gt; misc: update to e2fsprogs-1.45.6.wc7&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 1538b8f6d8c31143e059dc95c3724d01d9f93a13&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="53452">LU-11446</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01rsf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>