<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:36:12 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3704] sanity-hsm test_21 - test_24 Error: &apos;could not release file&apos;</title>
                <link>https://jira.whamcloud.com/browse/LU-3704</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Sanity-hsm test 21 seems to fail a lot. &lt;/p&gt;

&lt;p&gt;An example:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/adac0ef6-fb6b-11e2-8c6e-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/adac0ef6-fb6b-11e2-8c6e-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;&apos;could not release file&apos; seems to be the slightly more common error. &lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;test_21 	

    Error: &apos;could not release file&apos;
    Failure Rate: 32.00% of last 100 executions [all branches] 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;The test logs look like this: &lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;== sanity-hsm test 21: Simple release tests == 09:25:28 (1375374328)
2+0 records in
2+0 records out
2097152 bytes (2.1 MB) copied, 0.387647 s, 5.4 MB/s
Cannot send HSM request (use of /mnt/lustre/d0.sanity-hsm/d21/test_release): Device or resource busy
 sanity-hsm test_21: @@@@@@ FAIL: could not release file 
  Trace dump:
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;


&lt;p&gt;The test 3 and test 22-24 errors all look to be related. &lt;/p&gt;</description>
                <environment>autotest</environment>
        <key id="20195">LU-3704</key>
            <summary>sanity-hsm test_21 - test_24 Error: &apos;could not release file&apos;</summary>
                <type id="7" iconUrl="https://jira.whamcloud.com/images/icons/issuetypes/task_agile.png">Technical task</type>
                            <parent id="20020">LU-3647</parent>
                                    <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="bfaccini">Bruno Faccini</assignee>
                                    <reporter username="keith">Keith Mannthey</reporter>
                        <labels>
                            <label>HSM</label>
                    </labels>
                <created>Mon, 5 Aug 2013 22:07:06 +0000</created>
                <updated>Mon, 21 Oct 2013 20:32:51 +0000</updated>
                            <resolved>Mon, 2 Sep 2013 16:41:00 +0000</resolved>
                                    <version>Lustre 2.5.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>8</watches>
                                                                            <comments>
                            <comment id="63969" author="adegremont" created="Fri, 9 Aug 2013 14:54:13 +0000"  >&lt;p&gt;I think that test #3 and tests #21-24 are not related.&lt;/p&gt;

&lt;ul&gt;
	&lt;li&gt;test #3 is not doing any &quot;hsm_release&quot; commands.&lt;br/&gt;
It is failing to copy /etc/passwd into the Lustre mount point. Maybe there is a side effect on the system with this file. Maybe we should replace this copy with another way to create the file.&lt;/li&gt;
&lt;/ul&gt;


&lt;ul&gt;
	&lt;li&gt;tests #21-24.&lt;br/&gt;
I&apos;ve looked at test #21. It is failing somewhere at the end of the release process, when closing the file. I&apos;m lacking debug information to detect exactly where this is failing. EBUSY is returned when MDS_CLOSE is replied to but the OBD_FL_RELEASE flag was not set for some reason. It would be nice to have more debug information for that.&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="63976" author="keith" created="Fri, 9 Aug 2013 16:02:59 +0000"  >&lt;p&gt;The reason I mention they might be linked is they seem to fail together a lot. &lt;/p&gt;

&lt;p&gt;Another example:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/0c378cde-ff90-11e2-a3fb-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/0c378cde-ff90-11e2-a3fb-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;I will open LUs to track the other subtests. &lt;/p&gt;</comment>
                            <comment id="64133" author="jamesanunez" created="Mon, 12 Aug 2013 23:19:15 +0000"  >&lt;p&gt;Another set of test 3, 21-24 failures at: &lt;a href=&quot;https://maloo.whamcloud.com/test_sets/aa3d4616-001d-11e3-a856-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/aa3d4616-001d-11e3-a856-52540035b04c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="64141" author="jay" created="Tue, 13 Aug 2013 01:04:53 +0000"  >&lt;p&gt;I looked at the failure of test_3.&lt;/p&gt;

&lt;p&gt;The failure occurred when the client was trying to set system.posix_acl_access since test_3 uses `cp -p&apos; to copy file. Before doing that, it tried to update the client xattr cache so the calling sequence is as follows:&lt;/p&gt;

&lt;p&gt;ll_setxattr -&amp;gt; ll_xattr_cache_update -&amp;gt; ll_xattr_cache_refill -&amp;gt; IT_GETXATTR -&amp;gt; mdt_getxattr.&lt;/p&gt;

&lt;p&gt;However, in mdt_getxattr(), the code snippet below:&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;                eadatasize = mo_xattr_list(info-&amp;gt;mti_env, next, buf);
                &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (eadatasize &amp;lt; 0)
                        GOTO(out, rc = eadatasize);

                v = req_capsule_server_get(info-&amp;gt;mti_pill, &amp;amp;RMF_EAVALS);
                sizes = req_capsule_server_get(info-&amp;gt;mti_pill,
                                                &amp;amp;RMF_EAVALS_LENS);

                &lt;span class=&quot;code-comment&quot;&gt;/* Fill out EAVALS and EAVALS_LENS */&lt;/span&gt;
                &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; (b = buf-&amp;gt;lb_buf;
                     b &amp;lt; (&lt;span class=&quot;code-object&quot;&gt;char&lt;/span&gt; *)buf-&amp;gt;lb_buf + eadatasize;
                     b += strlen(b) + 1, v += rc) {
                        buf2.lb_buf = v;
                        rc = mdt_getxattr_one(info, b, next, &amp;amp;buf2, med, uc);
                        &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (rc &amp;lt; 0)
                                GOTO(out, rc);
                        sizes[eavallens] = rc;
                        buf2.lb_len -= rc;
                        eavallens++;
                        eavallen += rc;
                }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;returned ENODATA from mdt_getxattr_one(). I don&apos;t know what the xattr name is, due to the lack of logs on the MDT side.&lt;/p&gt;
</comment>
                            <comment id="64599" author="bfaccini" created="Tue, 20 Aug 2013 13:47:49 +0000"  >&lt;p&gt;test_3 failures are due to, as Jinshan detailed, an ENODATA return during the &lt;span class=&quot;error&quot;&gt;&amp;#91;cp -p /etc/passwd $TESTFILE.append || error &amp;quot;could not create file&amp;quot;&amp;#93;&lt;/span&gt; command when trying to set the &quot;system.posix_acl_access&quot; XATTR (but why ?). And it is now specifically addressed by &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3730&quot; title=&quot;sanity-hsm test_3 Error: &amp;#39;could not create file&amp;#39; &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3730&quot;&gt;&lt;del&gt;LU-3730&lt;/del&gt;&lt;/a&gt; !!&lt;/p&gt;

&lt;p&gt;test_21-24 failures, as detailed by Aurelien and to be addressed here, look more like a race/timing issue (like test_21 &quot;wrong block number&quot; errors for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3700&quot; title=&quot;sanity-hsm test_21 Error: &amp;#39;wrong block number&amp;#39; &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3700&quot;&gt;&lt;del&gt;LU-3700&lt;/del&gt;&lt;/a&gt;) due to the current usage of the &quot;lfs hsm_set --archived --exist &amp;lt;file&amp;gt;&quot; command to mimic &quot;lfs hsm_archive &amp;lt;file&amp;gt;&quot;. &quot;wait_request_state $fid ARCHIVE SUCCEED&quot; may also need to be used here ?&lt;/p&gt;

&lt;p&gt;Will try to set up a platform to reproduce the problem, with HSM debug traces enabled on Client/MDS VMs, and running sanity-hsm tests in a loop.&lt;/p&gt;</comment>
                            <comment id="65437" author="bfaccini" created="Fri, 30 Aug 2013 14:06:12 +0000"  >&lt;p&gt;I am not able to reproduce problem with current master, even by running sanity-hsm/test_&lt;span class=&quot;error&quot;&gt;&amp;#91;21-24&amp;#93;&lt;/span&gt; in a loop. I only had to avoid/ignore test_24 &quot;atime should be ...&quot; errors since it is still being worked by John in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3814&quot; title=&quot;Fix sanity-hsm test 24: &amp;quot;Release does not change a/mtime (i/o)&amp;quot;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3814&quot;&gt;&lt;del&gt;LU-3814&lt;/del&gt;&lt;/a&gt;/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3832&quot; title=&quot;osc_io_read_start() ignores O_NOATIME, updates i_atime&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3832&quot;&gt;&lt;del&gt;LU-3832&lt;/del&gt;&lt;/a&gt; I think, when test_24 is actually not run by default.&lt;/p&gt;

&lt;p&gt;BTW, according to Maloo reports test_&lt;span class=&quot;error&quot;&gt;&amp;#91;21-24&amp;#93;&lt;/span&gt; failures for &apos;could not release file&apos; stopped around Aug. 14th. And this seems to match with landing of patch for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3561&quot; title=&quot;Add a sanity test for HSM&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3561&quot;&gt;&lt;del&gt;LU-3561&lt;/del&gt;&lt;/a&gt; that brings &quot;real&quot; HSM features (copytool, lfs hsm-commands usage instead of hsm-flags setting) in tests and according tools testing.&lt;/p&gt;

&lt;p&gt;So my strong assumption is that this ticket can be closed because it is unrelated now.&lt;/p&gt;</comment>
                            <comment id="65559" author="bfaccini" created="Mon, 2 Sep 2013 16:41:00 +0000"  >&lt;p&gt;To be re-opened in case of recurrence.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="20277">LU-3730</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="20190">LU-3700</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvx7z:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9553</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>