<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:36:40 UTC 2024

You can restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-10616] replay-single test_70b fails with &apos;rundbench load on &lt;hostname(s)&gt; failed!&apos; </title>
                <link>https://jira.whamcloud.com/browse/LU-10616</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;replay-single test_70b fails with two error messages&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;replay-single test_70b: @@@@@@ FAIL: dbench stopped on some of onyx-31vm1.onyx.hpdd.intel.com,onyx-31vm2!
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;and later&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;replay-single test_70b: @@@@@@ FAIL: rundbench load on onyx-31vm1.onyx.hpdd.intel.com,onyx-31vm2 failed! 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Looking at the suite_log, we see:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;CMD: onyx-31vm1.onyx.hpdd.intel.com,onyx-31vm2 killall -0 dbench
onyx-31vm1: [3] open ./clients/client0 failed for handle 16385 (No such file or directory)
onyx-31vm1: (4) ERROR: handle 16385 was not found
onyx-31vm1: Child failed with status 1
onyx-31vm1: dbench: no process found
onyx-31vm1: dbench: no process found
 replay-single test_70b: @@@@@@ FAIL: dbench stopped on some of onyx-31vm1.onyx.hpdd.intel.com,onyx-31vm2! 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The only thing that looks suspicious in the console logs is on the MDS1, 3&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[ 5354.241985] Lustre: DEBUG MARKER: Started rundbench load pid=3403 ...
[ 5354.488828] LustreError: 12371:0:(osd_oi.c:978:osd_idc_find_or_init()) lustre-MDT0000: can&apos;t lookup: rc = -2
[ 5354.753146] Lustre: DEBUG MARKER: /usr/sbin/lctl mark  replay-single test_70b: @@@@@@ FAIL: dbench stopped on some of onyx-31vm1.onyx.hpdd.intel.com,onyx-31vm2! 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;This test has failed in this way many times, so far, for only full test sessions with DNE configured and ZFS:&lt;br/&gt;
2.10.57 el7 build 3703 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/46a0b60a-078f-11e8-bd00-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/46a0b60a-078f-11e8-bd00-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.57 el7 build 3702 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/13cdeb9e-0352-11e8-a10a-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/13cdeb9e-0352-11e8-a10a-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.57 el7 build 3700 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/fa0a850e-014f-11e8-a6ad-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/fa0a850e-014f-11e8-a6ad-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.57 el7 build 3697 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/ebd4b25e-fd83-11e7-a7cd-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/ebd4b25e-fd83-11e7-a7cd-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.57 el7 patchless build 59 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/dee6191a-ffaf-11e7-a6ad-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/dee6191a-ffaf-11e7-a6ad-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.57 el7 patchless build 58 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/16fa9310-fe7c-11e7-a6ad-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/16fa9310-fe7c-11e7-a6ad-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.56 el7 build 3693 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/d309f58a-f77b-11e7-bd00-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/d309f58a-f77b-11e7-bd00-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.56 el7 patchless build 53 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/38f48bae-f636-11e7-94c7-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/38f48bae-f636-11e7-94c7-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.56 el7 patchless build 50 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/c46aeb7c-f228-11e7-8c43-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/c46aeb7c-f228-11e7-8c43-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.56 el7 build 3685 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/6c00afc0-e7c0-11e7-8027-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/6c00afc0-e7c0-11e7-8027-52540065bddc&lt;/a&gt;&lt;br/&gt;
2.10.56 el7 patchless build 44 &#8211; &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/53f8d684-e674-11e7-a066-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/53f8d684-e674-11e7-a066-52540065bddc&lt;/a&gt;&lt;/p&gt;
</description>
                <environment></environment>
        <key id="50612">LU-10616</key>
            <summary>replay-single test_70b fails with &apos;rundbench load on &lt;hostname(s)&gt; failed!&apos; </summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="laisiyao">Lai Siyao</assignee>
                                    <reporter username="jamesanunez">James Nunez</reporter>
                        <labels>
                            <label>dne</label>
                            <label>zfs</label>
                    </labels>
                <created>Tue, 6 Feb 2018 18:45:24 +0000</created>
                <updated>Tue, 24 Jan 2023 22:50:58 +0000</updated>
                                            <version>Lustre 2.11.0</version>
                    <version>Lustre 2.12.0</version>
                    <version>Lustre 2.13.0</version>
                    <version>Lustre 2.10.6</version>
                    <version>Lustre 2.10.7</version>
                    <version>Lustre 2.12.3</version>
                    <version>Lustre 2.14.0</version>
                    <version>Lustre 2.12.5</version>
                    <version>Lustre 2.15.1</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="220630" author="jamesanunez" created="Fri, 9 Feb 2018 18:55:52 +0000"  >&lt;p&gt;From John Hammond, it looks like there is an issue with dbench start up as seen in the suite_log&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;trevis-11vm1: running &apos;dbench 1 -t 300&apos; on /mnt/lustre/d70b.replay-single/trevis-11vm1.trevis.hpdd.intel.com at Thu Feb  1 01:34:50 UTC 2018
trevis-11vm1: dbench PID=30955
trevis-11vm1: dbench version 4.00 - Copyright Andrew Tridgell 1999-2004
trevis-11vm1: 
trevis-11vm1: Running for 300 seconds with load &apos;client.txt&apos; and minimum warmup 60 secs
trevis-11vm1: failed to create barrier semaphore 
trevis-11vm1: 0 of 1 processes prepared for launch   0 sec
trevis-11vm2: dbench version 4.00 - Copyright Andrew Tridgell 1999-2004
trevis-11vm2: 
trevis-11vm2: Running for 300 seconds with load &apos;client.txt&apos; and minimum warmup 60 secs
trevis-11vm2: failed to create barrier semaphore 
trevis-11vm2: 0 of 1 processes prepared for launch   0 sec
CMD: trevis-11vm1.trevis.hpdd.intel.com,trevis-11vm2 killall -0 dbench
trevis-11vm1: 1 of 1 processes prepared for launch   0 sec
trevis-11vm1: releasing clients
trevis-11vm2: 1 of 1 processes prepared for launch   0 sec
trevis-11vm2: releasing clients
trevis-11vm1: [3] open ./clients/client0 failed for handle 16385 (No such file or directory)
trevis-11vm1: (4) ERROR: handle 16385 was not found
trevis-11vm1: Child failed with status 1
trevis-11vm1: dbench: no process found
trevis-11vm1: dbench: no process found
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="227029" author="sarah" created="Wed, 2 May 2018 00:25:03 +0000"  >&lt;p&gt;+1 on master 2.11.51 failover&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/7d85d5ce-492f-11e8-960d-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/7d85d5ce-492f-11e8-960d-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="257497" author="hornc" created="Fri, 1 Nov 2019 15:31:26 +0000"  >&lt;p&gt;+1 &lt;a href=&quot;https://testing.whamcloud.com/sub_tests/13bce654-fc76-11e9-98f1-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/sub_tests/13bce654-fc76-11e9-98f1-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="260656" author="adilger" created="Tue, 7 Jan 2020 00:25:50 +0000"  >&lt;p&gt;+1 on master: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/9333fec4-2406-11ea-b1e8-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/9333fec4-2406-11ea-b1e8-52540065bddc&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="286246" author="eaujames" created="Mon, 30 Nov 2020 12:09:20 +0000"  >&lt;p&gt;Hello,&lt;/p&gt;

&lt;p&gt;I have the same kind of messages on: &lt;a href=&quot;https://testing.whamcloud.com/sub_tests/a7c49599-b0e2-49e1-a4af-9111f676fdcf&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/sub_tests/a7c49599-b0e2-49e1-a4af-9111f676fdcf&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Except for this message:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
trevis-9vm4: [341] open ./clients/client0/~dmtmp/PARADOX/COURSES.DB failed &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; handle 9977 (Stale file handle)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="304985" author="adilger" created="Sat, 19 Jun 2021 17:46:49 +0000"  >&lt;p&gt;+1 on master &lt;a href=&quot;https://testing.whamcloud.com/test_sets/b5f87cba-d087-45dc-85ef-e1005ef15186&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/b5f87cba-d087-45dc-85ef-e1005ef15186&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="310186" author="adilger" created="Fri, 13 Aug 2021 19:08:56 +0000"  >&lt;p&gt;+1 on master &lt;a href=&quot;https://testing.whamcloud.com/test_sets/1c452361-2846-41bd-af35-995e1de3fd99&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/1c452361-2846-41bd-af35-995e1de3fd99&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="319508" author="artem_blagodarenko" created="Tue, 30 Nov 2021 08:08:45 +0000"  >&lt;p&gt;+1 on master &lt;a href=&quot;https://testing.whamcloud.com/test_sets/ee775d6f-00db-41b2-ad02-d4ae7e31ce6c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/ee775d6f-00db-41b2-ad02-d4ae7e31ce6c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="321561" author="qian_wc" created="Mon, 27 Dec 2021 08:38:23 +0000"  >&lt;p&gt;+1 on master &lt;a href=&quot;https://testing.whamcloud.com/test_sets/c154d88e-a784-4023-9c59-f40662559bea&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/c154d88e-a784-4023-9c59-f40662559bea&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="323076" author="adilger" created="Tue, 18 Jan 2022 19:07:33 +0000"  >&lt;p&gt;+1 on master: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/d3c778e5-e533-4a1d-8dce-263b64809701&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/d3c778e5-e533-4a1d-8dce-263b64809701&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="323614" author="artem_blagodarenko" created="Sat, 22 Jan 2022 17:40:48 +0000"  >&lt;p&gt;+1 &lt;a href=&quot;https://testing.whamcloud.com/test_sets/15d4b4b3-8a48-4743-b935-bf96afb0e27d&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/15d4b4b3-8a48-4743-b935-bf96afb0e27d&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="360258" author="adilger" created="Tue, 24 Jan 2023 22:50:58 +0000"  >&lt;p&gt;Lai, should replay-single test_70b be updated to add &quot;&lt;tt&gt;stack_trap fail_abort_cleanup&lt;/tt&gt;&quot; so that it can clean up afterward?  However, while the test is doing failover (via &lt;tt&gt;test-framework.sh::fail()-&amp;gt;facet_failover()&lt;/tt&gt;) it doesn&apos;t look like this subtest is actually aborting recovery, so it &lt;b&gt;shouldn&apos;t&lt;/b&gt; be seeing this kind of problem.&lt;/p&gt;

&lt;p&gt;This subtest is failing pretty regularly; could you please investigate why it is having problems during recovery?  It should be possible to use &quot;&lt;tt&gt;Test-Parameters: fortestonly testlist=replay-single env=ONLY=70b,ONLY_REPEAT=100 livedebug&lt;/tt&gt;&quot; to run 70b until the failure is hit and then leave the node in that state so you can log in and debug.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="64856">LU-14791</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="64981">LU-14813</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="68986">LU-15624</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="73365">LU-16336</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="71583">LU-16065</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzsbb:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>