<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:26:18 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2568] MDT unable to start with corrupted llog files.</title>
                <link>https://jira.whamcloud.com/browse/LU-2568</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;here is a log from failed mdt start:&lt;/p&gt;

&lt;p&gt;Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5302:0:(llog_lvfs.c:616:llog_lvfs_create()) error looking up logfile 0x7a4801b:0x2790e5b9: rc -116&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5302:0:(llog_cat.c:174:llog_cat_id2handle()) error opening log id 0x7a4801b:2790e5b9: rc -116&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5302:0:(llog_obd.c:318:cat_cancel_cb()) Cannot find handle for log 0x7a4801b&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5248:0:(llog_obd.c:391:llog_obd_origin_setup()) llog_process() with cat_cancel_cb failed: -116&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5248:0:(llog_obd.c:218:llog_setup_named()) obd mdd_obd-content-MDT0000 ctxt 12 lop_setup=ffffffff88625e70 failed -116&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5248:0:(mds_log.c:182:mds_changelog_llog_init()) changelog llog setup failed -116&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5248:0:(mdd_device.c:196:mdd_changelog_llog_init()) no changelog context&lt;br/&gt;
Feb 12 22:04:14 tstmds0a01 kernel: LustreError: 5248:0:(mdd_device.c:271:mdd_changelog_init()) Changelog setup during init failed -22&lt;br/&gt;
Feb 12 22:04:15 tstmds0a01 kernel: Lustre: content-MDT0000: used disk, loading&lt;br/&gt;
Feb 12 22:04:15 tstmds0a01 kernel: LustreError: 5248:0:(mdt_handler.c:1889:mdt_llog_ctxt_clone()) Can&apos;t get mdd ctxt -2&lt;br/&gt;
Feb 12 22:04:15 tstmds0a01 kernel: LustreError: 5248:0:(obd_config.c:522:class_setup()) setup content-MDT0000 failed (-2)&lt;/p&gt;</description>
                <environment></environment>
        <key id="17078">LU-2568</key>
            <summary>MDT unable to start with corrupted llog files.</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="wc-triage">WC Triage</assignee>
                                    <reporter username="zam">Alexander Zarochentsev</reporter>
                        <labels>
                    </labels>
                <created>Thu, 3 Jan 2013 17:16:30 +0000</created>
                <updated>Thu, 9 Jan 2020 06:20:26 +0000</updated>
                            <resolved>Thu, 9 Jan 2020 06:20:26 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="49949" author="zam" created="Fri, 4 Jan 2013 10:52:48 +0000"  >&lt;p&gt;Xyratex has a fix for this issue I will upload it later.&lt;/p&gt;</comment>
                            <comment id="50065" author="tappro" created="Mon, 7 Jan 2013 12:54:49 +0000"  >&lt;p&gt;Zam, this doesn&apos;t look like a master bug; is it from a Lustre version older than 2.3?&lt;/p&gt;</comment>
                            <comment id="50067" author="zam" created="Mon, 7 Jan 2013 13:37:28 +0000"  >&lt;p&gt;Yes, it is an older bug, but it looks like it is still in master.&lt;/p&gt;

&lt;p&gt;The issue was with missing llog files and their inode numbers were re-used for other objects.&lt;br/&gt;
llog_lvfs_create returns ESTALE in that case &amp;#8211; it is the error seen at the top level.&lt;/p&gt;

&lt;p&gt;The key fix was:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;diff --git a/lustre/obdclass/llog_lvfs.c b/lustre/obdclass/llog_lvfs.c
index 0987020..60bad4c 100644
--- a/lustre/obdclass/llog_lvfs.c
+++ b/lustre/obdclass/llog_lvfs.c
@@ -615,6 +615,10 @@ &lt;span class=&quot;code-keyword&quot;&gt;static&lt;/span&gt; &lt;span class=&quot;code-object&quot;&gt;int&lt;/span&gt; llog_lvfs_create(struct llog_ctxt *ctxt, struct llog_handle **res,
                         rc = PTR_ERR(dchild);
                         CERROR(&lt;span class=&quot;code-quote&quot;&gt;&quot;error looking up logfile &quot;&lt;/span&gt;LPX64&lt;span class=&quot;code-quote&quot;&gt;&quot;:0x%x: rc %d\n&quot;&lt;/span&gt;,
                                logid-&amp;gt;lgl_oid, logid-&amp;gt;lgl_ogen, rc);
+                        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc == -ESTALE)
+                                /* handle reused inode same way as
+                                   non-existing one */
+                                GOTO(out, rc = -ENOENT);
                         GOTO(out, rc);
                 }
 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I still think it is relevant to the master branch, but I haven&apos;t tried to reproduce it on master.&lt;/p&gt;</comment>
                            <comment id="50103" author="tappro" created="Tue, 8 Jan 2013 03:59:16 +0000"  >&lt;p&gt;llog_lvfs_create is not used anymore in master; llogs are OSD-based now. Do you have a reproducer for this? I suppose it shouldn&apos;t be a problem now if the cause was inode re-use, because llog objects are now FID-based, but we need to check that.&lt;/p&gt;</comment>
                            <comment id="260830" author="adilger" created="Thu, 9 Jan 2020 06:20:26 +0000"  >&lt;p&gt;Close old ticket.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvek7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6000</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>