<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:15:21 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-15089] sanity-lnet test_230: expected number of tcp connections 18</title>
                <link>https://jira.whamcloud.com/browse/LU-15089</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Elena &amp;lt;elena.gryaznova@hpe.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/9d97b8d9-9da1-4f76-a595-f827627ca5b9&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/9d97b8d9-9da1-4f76-a595-f827627ca5b9&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_230 failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;expected number of tcp connections 18
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;







&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
sanity-lnet test_230 - expected number of tcp connections 18&lt;/p&gt;</description>
                <environment></environment>
        <key id="66597">LU-15089</key>
            <summary>sanity-lnet test_230: expected number of tcp connections 18</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="ssmirnov">Serguei Smirnov</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Tue, 12 Oct 2021 16:21:25 +0000</created>
                <updated>Wed, 3 Nov 2021 03:30:15 +0000</updated>
                            <resolved>Wed, 3 Nov 2021 03:30:15 +0000</resolved>
                                    <version>Lustre 2.15.0</version>
                                    <fixVersion>Lustre 2.15.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="316238" author="adilger" created="Thu, 21 Oct 2021 19:18:02 +0000"  >&lt;p&gt;Serguei, this looks like it is related to the &lt;tt&gt;conns_per_peer&lt;/tt&gt; patch?&lt;/p&gt;</comment>
                            <comment id="316240" author="adilger" created="Thu, 21 Oct 2021 19:23:52 +0000"  >&lt;p&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/ViewProfile.jspa?name=jamesanunez&quot; class=&quot;user-hover&quot; rel=&quot;jamesanunez&quot;&gt;jamesanunez&lt;/a&gt;, something is broken with &lt;tt&gt;sanity-lnet&lt;/tt&gt;.  This subtest is continually failing:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;test_230 	

    Error: &apos;expected number of tcp connections 18&apos;
    Failure Rate: 35.00% of most recent 100 runs, 0 skipped (all branches) 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;(70/207 in the past 3 days) but the &lt;tt&gt;sanity-lnet&lt;/tt&gt; test run is always being marked as &quot;PASS&quot;:&lt;br/&gt;
&lt;a href=&quot;https://testing.whamcloud.com/test_sets/64366b2e-89d8-4fea-a98d-cd5a8af7ef21&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/64366b2e-89d8-4fea-a98d-cd5a8af7ef21&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;I suspect there is something missing at the end of &lt;tt&gt;sanity-lnet.sh&lt;/tt&gt; that is supposed to check for the failure status?&lt;/p&gt;</comment>
                            <comment id="316241" author="adilger" created="Thu, 21 Oct 2021 19:28:13 +0000"  >&lt;p&gt;The test failure was clearly introduced by patch &lt;a href=&quot;https://review.whamcloud.com/44417&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/44417&lt;/a&gt; &quot;&lt;tt&gt;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-12815&quot; title=&quot;Create multiple TCP sockets per SockLND&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-12815&quot;&gt;&lt;del&gt;LU-12815&lt;/del&gt;&lt;/a&gt; socklnd: set conns_per_peer based on link speed&lt;/tt&gt;&quot; because it was first hit when testing that patch, then immediately started failing regularly on master on 2021-08-17 after it landed.&lt;/p&gt;</comment>
                            <comment id="316259" author="gerrit" created="Thu, 21 Oct 2021 21:09:30 +0000"  >&lt;p&gt;&quot;Serguei Smirnov &amp;lt;ssmirnov@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/45331&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45331&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15089&quot; title=&quot;sanity-lnet test_230: expected number of tcp connections 18&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15089&quot;&gt;&lt;del&gt;LU-15089&lt;/del&gt;&lt;/a&gt; tests: allow enough time to create tcp connections&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 7a432a1048bb45b0265a3308520c0ff5b7671287&lt;/p&gt;</comment>
                            <comment id="316271" author="adilger" created="Fri, 22 Oct 2021 01:17:10 +0000"  >&lt;p&gt;It isn&apos;t obvious why &lt;tt&gt;sanity-lnet.sh&lt;/tt&gt; is not reporting a failure when &lt;tt&gt;test_230()&lt;/tt&gt; is failing.  The script has mostly the same bits at the end as &lt;tt&gt;sanity.sh&lt;/tt&gt;:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;complete $SECONDS

cleanup_testsuite
exit_status
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;and the test logs clearly show that &lt;tt&gt;complete()&lt;/tt&gt; is finding the &lt;tt&gt;FAIL&lt;/tt&gt; in &lt;tt&gt;$TESTSUITELOG&lt;/tt&gt;, and &lt;tt&gt;cleanup_testsuite()&lt;/tt&gt; is run as seen by &quot;&lt;tt&gt;Cleaning up LNet&lt;/tt&gt;&quot;:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;== sanity-lnet test complete, duration 824 sec =========== 15:31:11 (1634830271)
sanity-lnet: FAIL: test_230 expected number of tcp connections 26
Cleaning up LNet
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;It then proceeds to format and mount a new filesystem (&lt;tt&gt;setupall()&lt;/tt&gt;). The last line in the log is from &lt;tt&gt;init_param_vars()&lt;/tt&gt;, after which &lt;tt&gt;exit_status()&lt;/tt&gt; returns &quot;0&quot; (&lt;tt&gt;PASS&lt;/tt&gt;) instead of finding any error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;CMD: trevis-5vm9 /usr/sbin/lctl set_param lod.*.mdt_hash=crush
lod.lustre-MDT0000-mdtlov.mdt_hash=crush
CMD: trevis-5vm9 /usr/sbin/lctl set_param -P *.*.lbug_on_grant_miscount=1
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;The only thing that I can think of is that &lt;tt&gt;$TESTSUITELOG&lt;/tt&gt; is somehow unset/removed/truncated, so the &lt;tt&gt;FAIL&lt;/tt&gt; line is missed.  However, I only see &lt;tt&gt;$TESTSUITELOG&lt;/tt&gt; being set/removed in &lt;tt&gt;init_test_env()&lt;/tt&gt;, and that is only called at the start of the script.&lt;/p&gt;

&lt;p&gt;It might be worthwhile to print out a line in &lt;tt&gt;exit_status()&lt;/tt&gt; to help debug this:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
exit_status () {
        local status=0
        local logs=&lt;span class=&quot;code-quote&quot;&gt;&quot;$TESTSUITELOG $1&quot;&lt;/span&gt;

+       echo &lt;span class=&quot;code-quote&quot;&gt;&quot;== checking &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; failures in logs: &lt;span class=&quot;code-quote&quot;&gt;&apos;$logs&apos;&lt;/span&gt; ==&quot;&lt;/span&gt;
        &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; log in $logs; &lt;span class=&quot;code-keyword&quot;&gt;do&lt;/span&gt;
                &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; [ -f &lt;span class=&quot;code-quote&quot;&gt;&quot;$log&quot;&lt;/span&gt; ]; then
                        grep -qw FAIL $log &amp;amp;&amp;amp; status=1
                fi
        done

+       echo &lt;span class=&quot;code-quote&quot;&gt;&quot;== exiting with status=$status ==&quot;&lt;/span&gt;
        exit $status
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="316362" author="hornc" created="Fri, 22 Oct 2021 17:40:47 +0000"  >&lt;p&gt;I think we are deleting $TESTSUITELOG in sanity-lnet.sh:cleanup_testsuite():&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;cleanup_testsuite() {
        trap &quot;&quot; EXIT
        # Cleanup any tmp files created by the sub tests
        rm -f $TMP/sanity-lnet*
        cleanup_netns
        cleanup_lnet
        if $restore_mounts; then
                setupall || error &quot;Failed to setup Lustre after test execution&quot;
        elif $restore_modules; then
                load_modules ||
                        error &quot;Couldn&apos;t load modules after test execution&quot;
        fi
        return 0
}
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;That &lt;tt&gt;rm &amp;#45;f $TMP/sanity-lnet*&lt;/tt&gt; should probably be &lt;tt&gt;rm &amp;#45;f $TMP/sanity-lnet-*.yaml&lt;/tt&gt;&lt;/p&gt;</comment>
                            <comment id="316373" author="hornc" created="Fri, 22 Oct 2021 18:25:26 +0000"  >&lt;p&gt;Opened &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15150&quot; class=&quot;external-link&quot; rel=&quot;nofollow&quot;&gt;https://jira.whamcloud.com/browse/LU-15150&lt;/a&gt; for the suspected &lt;tt&gt;$TESTSUITELOG&lt;/tt&gt; deletion in &lt;tt&gt;cleanup_testsuite()&lt;/tt&gt; described in my previous comment.&lt;/p&gt;</comment>
                            <comment id="317278" author="gerrit" created="Wed, 3 Nov 2021 02:37:19 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/45331/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/45331/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15089&quot; title=&quot;sanity-lnet test_230: expected number of tcp connections 18&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15089&quot;&gt;&lt;del&gt;LU-15089&lt;/del&gt;&lt;/a&gt; tests: allow enough time to create tcp connections&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 5c766b005bf3e0bca0efa9d87ccf230e7cba97cc&lt;/p&gt;</comment>
                            <comment id="317305" author="pjones" created="Wed, 3 Nov 2021 03:30:15 +0000"  >&lt;p&gt;Landed for 2.15&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="66798">LU-15150</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="66801">LU-15152</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i026yv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>