<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:37:00 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>
    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3798] replay-single test_86: configuration log errors</title>
                <link>https://jira.whamcloud.com/browse/LU-3798</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Nathaniel Clark &amp;lt;nathaniel.l.clark@intel.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;http://maloo.whamcloud.com/test_sets/ae12d972-092d-11e3-b004-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://maloo.whamcloud.com/test_sets/ae12d972-092d-11e3-b004-52540035b04c&lt;/a&gt;.&lt;/p&gt;

&lt;p&gt;The sub-test test_86 failed with the following error:&lt;/p&gt;
&lt;blockquote&gt;
&lt;p&gt;test_86 failed with 5&lt;/p&gt;&lt;/blockquote&gt;

&lt;p&gt;Info required for matching: replay-single 86&lt;/p&gt;

&lt;p&gt;Client console log:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;02:47:43:if [ $running -eq 0 ] ; then
02:47:43:    mkdir -p /mnt/lustre;
02:47:43:    mount -t lustre -o user_xattr,acl,flock wtm-10vm7@tcp:/lustre /mnt/lustre;
02:47:43:    rc=$?;
02:47:43:fi;
02:47:43:exit $rc
02:47:43:LustreError: 152-6: Ignoring deprecated mount option &apos;acl&apos;.
02:47:43:LustreError: 15c-8: MGC10.10.16.120@tcp: The configuration from log &apos;lustre-client&apos; failed (-5). This may be the result of communication errors between this node and the MGS, a bad configuration, or other errors. See the syslog for more information.
02:47:43:LustreError: 9196:0:(llite_lib.c:1046:ll_fill_super()) Unable to process log: -5
02:47:43:Lustre: Unmounted lustre-client
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="20511">LU-3798</key>
            <summary>replay-single test_86: configuration log errors</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="bogl">Bob Glossman</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                            <label>zfs</label>
                    </labels>
                <created>Tue, 20 Aug 2013 21:17:53 +0000</created>
                <updated>Tue, 14 Dec 2021 22:52:26 +0000</updated>
                            <resolved>Tue, 14 Dec 2021 22:52:26 +0000</resolved>
                                    <version>Lustre 2.5.0</version>
                    <version>Lustre 2.8.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="64761" author="adilger" created="Wed, 21 Aug 2013 17:21:53 +0000"  >&lt;p&gt;I suspect this is some kind of race between mounting the MDS/MGS (which is slow for some reason) and remounting the client but the MGS is not yet ready.  We could have the client retry the mount a couple of times (with &quot;-o retry=5&quot; mount option on the client) to see if that solves the problem?&lt;/p&gt;</comment>
                            <comment id="64766" author="adilger" created="Wed, 21 Aug 2013 17:52:38 +0000"  >&lt;p&gt;It looks like this test only started failing regularly on July 31st (only 4 failures ever before then, maybe once every few months), and has failed fairly consistently since then (40 failures in 21 days), so it is almost certainly a regression landed on 2013-07-31.&lt;/p&gt;

&lt;p&gt;The patch in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3155&quot; title=&quot;Permanent parameters with lctl set_param -P&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3155&quot;&gt;&lt;del&gt;LU-3155&lt;/del&gt;&lt;/a&gt; &lt;a href=&quot;http://review.whamcloud.com/6025&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/6025&lt;/a&gt; would be a prime culprit, since it is one of the major changes to configuration that was landed at that time.  It would be worthwhile to look through the test failures and find the latest commit that is common to all of them.&lt;/p&gt;

&lt;p&gt;The below query finds all of the test_86 failures, then each one needs to go to the main &quot;replay-single&quot; test log, then the specific git commit hash for that test needs to be used to find the &quot;parent&quot; on which the patch was based.  The latest common parent among all the failures (excepting possibly the failing patch itself) is the likely source of the regression.&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://maloo.whamcloud.com/sub_tests/query?commit=Update+results&amp;amp;page=2&amp;amp;sub_test[query_bugs]=&amp;amp;sub_test[status]=FAIL&amp;amp;sub_test[sub_test_script_id]=fcadf0d2-32c3-11e0-a61c-52540025f9ae&amp;amp;test_node[architecture_type_id]=&amp;amp;test_node[distribution_type_id]=&amp;amp;test_node[file_system_type_id]=&amp;amp;test_node[lustre_branch_id]=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;test_node[os_type_id]=&amp;amp;test_node_network[network_type_id]=&amp;amp;test_session[query_date]=&amp;amp;test_session[query_recent_period]=2419200&amp;amp;test_session[test_group]=&amp;amp;test_session[test_host]=&amp;amp;test_session[user_id]=&amp;amp;test_set[test_set_script_id]=f6a12204-32c3-11e0-a61c-52540025f9ae&amp;amp;utf8=%E2%9C%93&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/sub_tests/query?commit=Update+results&amp;amp;page=2&amp;amp;sub_test[query_bugs]=&amp;amp;sub_test[status]=FAIL&amp;amp;sub_test[sub_test_script_id]=fcadf0d2-32c3-11e0-a61c-52540025f9ae&amp;amp;test_node[architecture_type_id]=&amp;amp;test_node[distribution_type_id]=&amp;amp;test_node[file_system_type_id]=&amp;amp;test_node[lustre_branch_id]=24a6947e-04a9-11e1-bb5f-52540025f9af&amp;amp;test_node[os_type_id]=&amp;amp;test_node_network[network_type_id]=&amp;amp;test_session[query_date]=&amp;amp;test_session[query_recent_period]=2419200&amp;amp;test_session[test_group]=&amp;amp;test_session[test_host]=&amp;amp;test_session[user_id]=&amp;amp;test_set[test_set_script_id]=f6a12204-32c3-11e0-a61c-52540025f9ae&amp;amp;utf8=%E2%9C%93&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="65073" author="pjones" created="Mon, 26 Aug 2013 16:30:23 +0000"  >&lt;p&gt;Bob&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="65274" author="bogl" created="Wed, 28 Aug 2013 16:53:13 +0000"  >&lt;p&gt;A couple of key features seen in all the instances found:&lt;br/&gt;
1) only seen in review-zfs test runs, not any in review&lt;br/&gt;
2) the test_86 failure isn&apos;t the first failed test in replay-single.  It always follows other failures, though not always the same ones.  Subtests in test_58 and test_85 are the most common.&lt;/p&gt;

&lt;p&gt;Based on 1), we might want to get a zfs expert to look at this.&lt;/p&gt;

&lt;p&gt;I am continuing to try to narrow it down.&lt;/p&gt;</comment>
                            <comment id="65275" author="bogl" created="Wed, 28 Aug 2013 17:01:03 +0000"  >&lt;p&gt;Another fact: there haven&apos;t been any instances seen at all since 8/19.  I am wondering if the problem may have been fixed by a more recent commit.&lt;/p&gt;</comment>
                            <comment id="65287" author="bogl" created="Wed, 28 Aug 2013 17:53:06 +0000"  >&lt;p&gt;Surveying all the instances the latest common parent is the commit for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3155&quot; title=&quot;Permanent parameters with lctl set_param -P&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3155&quot;&gt;&lt;del&gt;LU-3155&lt;/del&gt;&lt;/a&gt;. That is the same one Andreas called out as suspicious in his comment.  Evidence is stacking up that it&apos;s the cause.&lt;/p&gt;</comment>
                            <comment id="65736" author="bogl" created="Wed, 4 Sep 2013 14:59:27 +0000"  >&lt;p&gt;Since evidence suggests &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3155&quot; title=&quot;Permanent parameters with lctl set_param -P&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3155&quot;&gt;&lt;del&gt;LU-3155&lt;/del&gt;&lt;/a&gt; was the cause of this problem we need the author to comment.&lt;/p&gt;</comment>
                            <comment id="65737" author="bogl" created="Wed, 4 Sep 2013 15:01:53 +0000"  >&lt;p&gt;There is now at least one counterexample to the connection of this bug to zfs.  At least 1 recent failure was seen in a review run: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/5df51836-132a-11e3-8c44-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/5df51836-132a-11e3-8c44-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Still happens a lot more with zfs.&lt;/p&gt;</comment>
                            <comment id="65819" author="artem_blagodarenko" created="Thu, 5 Sep 2013 09:59:25 +0000"  >&lt;p&gt;from replay-single.test_86.debug_log.client-26vm2.1378029549 :&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;00000100:02020000:0.0:1378029519.217418:0:22466:0:(client.c:1168:ptlrpc_check_status()) 11-0: MGC10.10.4.154@tcp: Communicating with 10.10.4.154@tcp, operation ldlm_enqueue failed with -107.
.. 

10000000:01000000:0.0:1378029519.217530:0:22466:0:(mgc_request.c:1849:mgc_process_log()) Can&apos;t get cfg lock: -107
10000000:01000000:0.0:1378029519.217535:0:22466:0:(mgc_request.c:1868:mgc_process_log()) MGC10.10.4.154@tcp: configuration from log &lt;span class=&quot;code-quote&quot;&gt;&apos;lustre-client&apos;&lt;/span&gt; failed (-5).
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The test is called &quot;replay-single test 86: umount server after clear nid_stats should not hit LBUG&quot;, so it looks like we unmount the server before the config file is processed.&lt;/p&gt;
</comment>
                            <comment id="125114" author="sarah" created="Tue, 25 Aug 2015 20:31:35 +0000"  >&lt;p&gt;Hit this error in interop testing between a 2.7.0 server and a master RHEL6.6 client:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/bbeec3b0-454b-11e5-a64b-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/bbeec3b0-454b-11e5-a64b-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="127259" author="sarah" created="Mon, 14 Sep 2015 17:56:48 +0000"  >&lt;p&gt;another instance:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3d5c7066-5157-11e5-9f68-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3d5c7066-5157-11e5-9f68-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="20513">LU-3800</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="18333">LU-3155</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvypr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9816</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>