<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:24:24 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-9234] replay-single test_70f: checksum doesn&apos;t match</title>
                <link>https://jira.whamcloud.com/browse/LU-9234</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/1a6bc6e8-0a05-11e7-9053-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/1a6bc6e8-0a05-11e7-9053-5254006e85c2&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;After unmounting/mounting an OST, client detects a checksum mismatch:&lt;/p&gt;

&lt;p&gt;test_log:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;CMD: onyx-35vm4 umount -d /mnt/lustre-ost1
CMD: onyx-35vm4 lsmod | grep lnet &amp;gt; /dev/null &amp;amp;&amp;amp; lctl dl | grep &apos; ST &apos;
reboot facets: ost1
Failover ost1 to onyx-35vm4
03:10:44 (1489572644) waiting for onyx-35vm4 network 900 secs ...
03:10:44 (1489572644) network interface is UP
CMD: onyx-35vm4 hostname
mount facets: ost1
CMD: onyx-35vm4 test -b /dev/lvm-Role_OSS/P1
CMD: onyx-35vm4 e2label /dev/lvm-Role_OSS/P1
Starting ost1:   /dev/lvm-Role_OSS/P1 /mnt/lustre-ost1
CMD: onyx-35vm4 mkdir -p /mnt/lustre-ost1; mount -t lustre
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;followed by:&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;CMD: onyx-35vm6 md5sum /mnt/lustre/d70f.replay-single/f70f.replay-single.onyx-35vm5.onyx.hpdd.intel.com
onyx-35vm5: osc.lustre-OST0000-osc-*.ost_server_uuid in FULL state after 3 sec
onyx-35vm6: osc.lustre-OST0000-osc-*.ost_server_uuid in FULL state after 3 sec
 replay-single test_70f: @@@@@@ FAIL: /mnt/lustre/d70f.replay-single/f70f.replay-single.onyx-35vm5.onyx.hpdd.intel.com: checksum doesn&apos;t match on onyx-35vm6 
  Trace dump:
  = /usr/lib64/lustre/tests/test-framework.sh:4841:error()
  = /usr/lib64/lustre/tests/replay-single.sh:2334:test_70f_write_and_read()
  = /usr/lib64/lustre/tests/replay-single.sh:2350:test_70f_loop()
  = /usr/lib64/lustre/tests/replay-single.sh:2394:test_70f()
  = /usr/lib64/lustre/tests/test-framework.sh:5117:run_one()
  = /usr/lib64/lustre/tests/test-framework.sh:5156:run_one_logged()
  = /usr/lib64/lustre/tests/test-framework.sh:5003:run_test()
  = /usr/lib64/lustre/tests/replay-single.sh:2415:main()
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>onyx-35vm3 thru 6, Interop test, &lt;br/&gt;
RHEL7.3/ldiskfs, branch master, v2.9.54, b3541, 2.9 Lustre, &lt;br/&gt;
Client 2.10 Lustre&lt;br/&gt;
</environment>
        <key id="44904">LU-9234</key>
            <summary>replay-single test_70f: checksum doesn&apos;t match</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="sarah">Sarah Liu</assignee>
                                    <reporter username="jcasper">James Casper</reporter>
                        <labels>
                    </labels>
                <created>Mon, 20 Mar 2017 23:19:14 +0000</created>
                <updated>Tue, 27 Mar 2018 16:43:50 +0000</updated>
                            <resolved>Tue, 27 Mar 2018 16:43:50 +0000</resolved>
                                    <version>Lustre 2.10.0</version>
                    <version>Lustre 2.11.0</version>
                                    <fixVersion>Lustre 2.10.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="189102" author="jamesanunez" created="Tue, 21 Mar 2017 15:01:28 +0000"  >&lt;p&gt;In the console for the OSTs, we see:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;03:11:42:[18142.619725] Lustre: lustre-OST0000: Will be in recovery for at least 1:00, or until 3 clients reconnect
03:11:42:[18144.679276] LustreError: 32511:0:(ofd_grant.c:686:ofd_grant_check()) lustre-OST0000: cli df47be9e-3378-d13b-7555-c154ed48e9ba is replaying OST_WRITE while one rnb hasn&apos;t OBD_BRW_FROM_GRANT set (0x108)
03:11:42:[18144.711883] LustreError: 168-f: BAD WRITE CHECKSUM: lustre-OST0000 from 12345-10.2.4.142@tcp inode [0x20001a213:0xb88d:0x0] object 0x0:9508 extent [0-1048575]: client csum 32a1611e, server csum 66771e72
03:11:42:[18144.873216] Lustre: lustre-OST0000: Recovery over after 0:03, of 3 clients 3 recovered and 0 were evicted.
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Looking through Maloo, replay-single test 70f started failing at the beginning of February of this year (2017) and has failed 60 times for the full test group since that time. All failures I&apos;ve seen are during interop testing.&lt;/p&gt;

&lt;p&gt;Some early failure logs are at:&lt;br/&gt;
2017-02-03 - (upstream client + master servers) &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/766efa26-eaf4-11e6-af25-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/766efa26-eaf4-11e6-af25-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2017-02-04 - (master clients + b2_8 servers) &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/2122fcde-eba8-11e6-848c-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/2122fcde-eba8-11e6-848c-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2017-02-04 - (master clients + b2_9 servers) &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3e6136de-eba9-11e6-9bb9-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3e6136de-eba9-11e6-9bb9-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2017-02-07 -  (master clients + b2_8 servers) &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/deae1082-ee27-11e6-bbfe-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/deae1082-ee27-11e6-bbfe-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2017-02-07 -  (master clients + b2_8 servers)  &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/bf86630e-edf9-11e6-8f6d-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/bf86630e-edf9-11e6-8f6d-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="189141" author="pjones" created="Tue, 21 Mar 2017 17:24:24 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Could you please advise on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="190361" author="bobijam" created="Sat, 1 Apr 2017 04:17:04 +0000"  >&lt;p&gt;The replay-single test 70f only works with OSS server versions after 2.9.52.60 (the issue is &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1573&quot; title=&quot;avoid data corruption for direct io data&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1573&quot;&gt;&lt;del&gt;LU-1573&lt;/del&gt;&lt;/a&gt;, patch #16680 with git commit 1d2fbade1b658db4386091e7938d9483f7aa4a05), so 2.8/2.9 servers do not contain this fix.&lt;/p&gt;

&lt;p&gt;As for the master server failure case, I checked the Maloo report: the OSS version is 2.9.52.54.gc6f5e81, which does not have this fix either.&lt;/p&gt;</comment>
                            <comment id="192718" author="gerrit" created="Wed, 19 Apr 2017 16:52:17 +0000"  >&lt;p&gt;Wei Liu (wei3.liu@intel.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/26739&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/26739&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9234&quot; title=&quot;replay-single test_70f: checksum doesn&amp;#39;t match&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9234&quot;&gt;&lt;del&gt;LU-9234&lt;/del&gt;&lt;/a&gt; test: Skip test_70f if OSS version is older than 2.9.53&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 70d77276b26a9a92621bc4aef4f3f04cb6da310f&lt;/p&gt;</comment>
                            <comment id="194028" author="gerrit" created="Mon, 1 May 2017 17:47:30 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/26739/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/26739/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9234&quot; title=&quot;replay-single test_70f: checksum doesn&amp;#39;t match&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9234&quot;&gt;&lt;del&gt;LU-9234&lt;/del&gt;&lt;/a&gt; test: Skip test_70f if OSS version is older than 2.9.53&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 00db1ffe72bc1f4504adfaba539a1ec4f0fde74b&lt;/p&gt;</comment>
                            <comment id="194058" author="pjones" created="Mon, 1 May 2017 18:42:50 +0000"  >&lt;p&gt;Landed for 2.10&lt;/p&gt;</comment>
                            <comment id="206173" author="casperjx" created="Wed, 23 Aug 2017 17:39:55 +0000"  >&lt;p&gt;Seen again in 2.10.51 (b3620):&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/c4874eda-04c9-40c5-9e92-b8e7574bd5fe&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/c4874eda-04c9-40c5-9e92-b8e7574bd5fe&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="218660" author="jamesanunez" created="Fri, 19 Jan 2018 17:40:52 +0000"  >&lt;p&gt;There seems to still be an issue with checksums that shows up in replay-single test 87a, but I&apos;ll open a new ticket for that issue.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="50917">LU-10702</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzz7sv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>