<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:34:15 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10349] debug and cleanup of corrupted PFID, unmatched MDT-object and OST-object pairs</title>
                <link>https://jira.whamcloud.com/browse/LU-10349</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This ticket is created to handle NASA-specific debugging of corrupted PFIDs discussed in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10248&quot; title=&quot;Need to update PFID of OST objects after layout change&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10248&quot;&gt;&lt;del&gt;LU-10248&lt;/del&gt;&lt;/a&gt;, as well as ensure ports of a fix for lfsck handling of repaired_unmatched_pair, and any other related questions to ensure proper running of lfsck and cleanup of the filesystem.&lt;/p&gt;

&lt;p&gt;servers: lustre-2.7.3-1nasS_mofed33v3g_2.6.32_642.15.1.el6.20170609.x86_64.lustre273.x86_64 (basically the old FE branch, plus several cherry-picked patches)&lt;/p&gt;

&lt;p&gt;clients: lustre-client-2.9.0-2.3nasC_mofed34v1_4.4.74_92.32.1.20170808_nasa.x86_64&lt;/p&gt;

&lt;p&gt;We hope to upgrade both to a 2.10.2-based build in the near future.&lt;/p&gt;</description>
                <environment>servers: lustre-2.7.3-1nasS_mofed33v3g_2.6.32_642.15.1.el6.20170609.x86_64.lustre273.x86_64&lt;br/&gt;
clients: lustre-client-2.9.0-2.3nasC_mofed34v1_4.4.74_92.32.1.20170808_nasa.x86_64</environment>
        <key id="49641">LU-10349</key>
            <summary>debug and cleanup of corrupted PFID, unmatched MDT-object and OST-object pairs</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="yong.fan">nasf</assignee>
                                    <reporter username="ndauchy">Nathan Dauchy</reporter>
                        <labels>
                    </labels>
                <created>Thu, 7 Dec 2017 16:53:31 +0000</created>
                <updated>Mon, 26 Mar 2018 12:34:40 +0000</updated>
                            <resolved>Mon, 26 Mar 2018 12:34:40 +0000</resolved>
                                    <version>Lustre 2.7.0</version>
                    <version>Lustre 2.9.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="215572" author="ndauchy" created="Thu, 7 Dec 2017 17:03:03 +0000"  >&lt;p&gt;At this time, it sounds like we should go with &quot;choice 2&quot; in the comment from nasf:&lt;br/&gt;
&lt;a href=&quot;https://jira.hpdd.intel.com/browse/LU-10248?focusedCommentId=215528&amp;amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#comment-215528&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://jira.hpdd.intel.com/browse/LU-10248?focusedCommentId=215528&amp;amp;page=com.atlassian.jira.plugin.system.issuetabpanels%3Acomment-tabpanel#comment-215528&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;We will leave the inconsistencies the way they are until the lfsck patch is available and we can upgrade the servers to include it.&lt;/p&gt;

&lt;p&gt;The only caveat is that we will be continuing to drain and completely remove multiple OSTs from this file system (to free up the hardware for spares) and I want to make sure that won&apos;t combine with the PFID issues and confuse lfsck.  One OST is already gone, and the last dry-run lfsck did not appear to die on it so hopefully we are OK on that front... it&apos;s just the debug logs getting overwritten with the repaired_inconsistent_owner errors might have masked other problems.  Please let me know ASAP if I should &lt;b&gt;not&lt;/b&gt; remove additional OSTs.&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="215575" author="pjones" created="Thu, 7 Dec 2017 17:21:44 +0000"  >&lt;p&gt;Fan Yong is already assisting here&lt;/p&gt;</comment>
                            <comment id="215640" author="yong.fan" created="Fri, 8 Dec 2017 05:05:09 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=ndauchy&quot; class=&quot;user-hover&quot; rel=&quot;ndauchy&quot;&gt;ndauchy&lt;/a&gt;, would you please check whether or not your branch has the following two patches:&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/#/c/16135/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/16135/&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/#/c/30447/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/30447/&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;If not, please try to apply them and re-run the layout LFSCK in dry-run mode. Thanks!&lt;/p&gt;</comment>
                            <comment id="215661" author="ndauchy" created="Fri, 8 Dec 2017 15:14:46 +0000"  >&lt;p&gt;Since we are based on 2.7.3 FE branch, I&apos;m pretty confident we have the first of those patches, but not the second since it looks like you just created the backport (and it failed a build test).  Will confirm though.&lt;/p&gt;

&lt;p&gt;Regardless, it will be a while before we can complete the server rebuild and take a downtime to apply it.  In the meantime I need to move forward with removing additional OSTs from the file system to free up the hardware for spares.  Do you recommend we run the current lfsck in non-dry-run mode, or just go ahead and remove the OST now and wait for the lfsck updates?&lt;/p&gt;

&lt;p&gt;Thanks!&lt;/p&gt;</comment>
                            <comment id="215828" author="jaylan" created="Fri, 8 Dec 2017 19:43:23 +0000"  >&lt;p&gt;We do not have either.&lt;/p&gt;

&lt;p&gt;Review #16135 is in &apos;Need Code-Review&apos; state for more than 1 year. Is it OK to cherry-pick as it is, Fan?&lt;/p&gt;</comment>
                            <comment id="216035" author="yong.fan" created="Tue, 12 Dec 2017 10:17:28 +0000"  >&lt;blockquote&gt;
&lt;p&gt;Regardless, it will be a while before we can complete the server rebuild and take a downtime to apply it. In the meantime I need to move forward with removing additional OSTs from the file system to free up the hardware for spares. Do you recommend we run the current lfsck in non-dry-run mode, or just go ahead and remove the OST now and wait for the lfsck updates?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;There are two kinds of inconsistency reported by the layout LFSCK. One is inconsistent owner information, which is caused by a known layout LFSCK issue and can be ignored. The other is the unmatched MDT-object and OST-object pairs. Such inconsistency will NOT affect normal system access unless I/O verification (disabled by default) is explicitly enabled. So I would suggest to keep the system unchanged since it is without influence now.&lt;/p&gt;

&lt;blockquote&gt;
&lt;p&gt;Review #16135 is in &apos;Need Code-Review&apos; state for more than 1 year. Is it OK to cherry-pick as it is, Fan?&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;Yes, I think so. That patch has already landed on b2_8_fe and master. It is not on b2_7_fe, maybe because b2_7 was somewhat old at that time and the issue is not very serious.&lt;/p&gt;</comment>
                            <comment id="216075" author="ndauchy" created="Tue, 12 Dec 2017 17:51:41 +0000"  >&lt;blockquote&gt;
&lt;p&gt;So I would suggest to keep the system unchanged since it is without influence now.&lt;/p&gt;&lt;/blockquote&gt;
&lt;p&gt;OK, we will proceed with removing the additional OSTs from the file system, and wait for install of the patched lfsck on the 2.7.3 servers and perform the cleanup later.&#160; Thanks!&lt;/p&gt;</comment>
                            <comment id="216843" author="yong.fan" created="Wed, 20 Dec 2017 15:11:23 +0000"  >&lt;p&gt;The patch for repair unexpected inconsistent owner on b2_7_fe:&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/30613&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/30613&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="219231" author="yong.fan" created="Fri, 26 Jan 2018 05:14:50 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=ndauchy&quot; class=&quot;user-hover&quot; rel=&quot;ndauchy&quot;&gt;ndauchy&lt;/a&gt;,&lt;/p&gt;

&lt;p&gt;The patch &lt;a href=&quot;https://review.whamcloud.com/#/c/30612/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/30612/&lt;/a&gt; for fixing the issue of unexpected inconsistent owner has already landed on master. It has also been ported to the b2_7_fe branch via the patch &lt;a href=&quot;https://review.whamcloud.com/30613&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/30613&lt;/a&gt;. You can use the related patch to resolve your system trouble. Please let me know what else you need.&lt;/p&gt;</comment>
                            <comment id="219381" author="jaylan" created="Mon, 29 Jan 2018 19:58:54 +0000"  >&lt;p&gt;The above patch #30612 for b2_10 is at&lt;br/&gt;
&lt;a href=&quot;https://review.whamcloud.com/#/c/30628/1&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/30628/1&lt;/a&gt;&lt;br/&gt;
Could you land this?&lt;/p&gt;</comment>
                            <comment id="219387" author="pjones" created="Mon, 29 Jan 2018 20:22:28 +0000"  >&lt;p&gt;Jay&lt;/p&gt;

&lt;p&gt;That is being tracked under &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10422&quot; title=&quot;layout LFSCK try to fix consistent owner unexpectedly&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10422&quot;&gt;&lt;del&gt;LU-10422&lt;/del&gt;&lt;/a&gt; and it will land as soon as the reviews have completed&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="224525" author="pjones" created="Mon, 26 Mar 2018 12:34:40 +0000"  >&lt;p&gt;AFAICT this is now resolved with the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-10422&quot; title=&quot;layout LFSCK try to fix consistent owner unexpectedly&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-10422&quot;&gt;&lt;del&gt;LU-10422&lt;/del&gt;&lt;/a&gt; fix landed to b2_10&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="49954">LU-10422</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="29372">LU-6420</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzoxr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>