<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:30:42 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-16872] sanity: test_27M Error: &apos;(5) stripe count , should be 8 for append&apos;</title>
                <link>https://jira.whamcloud.com/browse/LU-16872</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for Frank Sehr &amp;lt;fsehr@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/46d1b101-8e4f-4415-bb49-ee39963275fe&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/46d1b101-8e4f-4415-bb49-ee39963275fe&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Test session details:&lt;br/&gt;
clients: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-reviews/95319&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-reviews/95319&lt;/a&gt; - 4.18.0-425.10.1.el8_7.x86_64&lt;br/&gt;
servers: &lt;a href=&quot;https://build.whamcloud.com/job/lustre-reviews/95319&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-reviews/95319&lt;/a&gt; - 4.18.0-425.10.1.el8_lustre.x86_64&lt;/p&gt;

&lt;p&gt;== sanity test 27M: test O_APPEND striping =============== 03:40:09 (1685936409)&lt;br/&gt;
CMD: trevis-129vm4 /usr/sbin/lctl get_param -n version 2&amp;gt;/dev/null&lt;br/&gt;
striped dir -i3 -c2 -H crush2 /mnt/lustre/d27M.sanity&lt;br/&gt;
CMD: trevis-129vm4 /usr/sbin/lctl get_param -n mdd.lustre-MDT0000.append_pool&lt;br/&gt;
CMD: trevis-129vm4 /usr/sbin/lctl get_param -n mdd.lustre-MDT0000.append_stripe_count&lt;br/&gt;
CMD: trevis-129vm4,trevis-129vm5 /usr/sbin/lctl set_param mdd.*.append_stripe_count=0&lt;br/&gt;
mdd.lustre-MDT0000.append_stripe_count=0&lt;br/&gt;
mdd.lustre-MDT0002.append_stripe_count=0&lt;br/&gt;
mdd.lustre-MDT0001.append_stripe_count=0&lt;br/&gt;
mdd.lustre-MDT0003.append_stripe_count=0&lt;br/&gt;
CMD: trevis-129vm4,trevis-129vm5 /usr/sbin/lctl set_param mdd.*.append_stripe_count=2&lt;br/&gt;
mdd.lustre-MDT0000.append_stripe_count=2&lt;br/&gt;
mdd.lustre-MDT0002.append_stripe_count=2&lt;br/&gt;
mdd.lustre-MDT0001.append_stripe_count=2&lt;br/&gt;
mdd.lustre-MDT0003.append_stripe_count=2&lt;br/&gt;
CMD: trevis-129vm4,trevis-129vm5 /usr/sbin/lctl set_param mdd.*.append_stripe_count=-1&lt;br/&gt;
mdd.lustre-MDT0000.append_stripe_count=-1&lt;br/&gt;
mdd.lustre-MDT0002.append_stripe_count=-1&lt;br/&gt;
mdd.lustre-MDT0001.append_stripe_count=-1&lt;br/&gt;
mdd.lustre-MDT0003.append_stripe_count=-1&lt;br/&gt;
/usr/lib64/lustre/tests/sanity.sh: line 3101: /mnt/lustre/d27M.sanity/f27M.sanity.5: Invalid argument&lt;br/&gt;
lfs: getstripe for &apos;/mnt/lustre/d27M.sanity/f27M.sanity.5&apos; failed: No such file or directory&lt;br/&gt;
/usr/lib64/lustre/tests/sanity.sh: line 3103: [: -eq: unary operator expected&lt;br/&gt;
 sanity test_27M: @@@@@@ FAIL: (5) stripe count , should be 8 for append &lt;br/&gt;
  Trace dump:&lt;br/&gt;
  = /usr/lib64/lustre/tests/test-framework.sh:6585:error()&lt;br/&gt;
  = /usr/lib64/lustre/tests/sanity.sh:3104:test_27M()&lt;br/&gt;
  = /usr/lib64/lustre/tests/test-framework.sh:6925:run_one()&lt;br/&gt;
  = /usr/lib64/lustre/tests/test-framework.sh:6974:run_one_logged()&lt;br/&gt;
  = /usr/lib64/lustre/tests/test-framework.sh:6811:run_test()&lt;br/&gt;
  = /usr/lib64/lustre/tests/sanity.sh:3181:main()&lt;br/&gt;
Dumping lctl log to /autotest/autotest-2/2023-06-05/lustre-reviews_review-ldiskfs-dne_95319_27_26b27a74-2421-4453-9c33-cd237feca413//sanity.test_27M.*.1685936415.log&lt;br/&gt;
CMD: trevis-129vm1.trevis.whamcloud.com,trevis-129vm2,trevis-129vm3,trevis-129vm4,trevis-129vm5 /usr/sbin/lctl dk &amp;gt; /autotest/autotest-2/2023-06-05/lustre-reviews_review-ldiskfs-dne_95319_27_26b27a74-2421-4453-9c33-cd237feca413//sanity.test_27M.debug_log.\$(hostname -s).1685936415.log;&lt;br/&gt;
		dmesg &amp;gt; /autotest/autotest-2/2023-06-05/lustre-reviews_review-ldiskfs-dne_95319_27_26b27a74-2421-4453-9c33-cd237feca413//sanity.test_27M.dmesg.\$(hostname -s).1685936415.log&lt;br/&gt;
CMD: trevis-129vm4,trevis-129vm5 /usr/sbin/lctl set_param mdd.*.append_stripe_count=1&lt;br/&gt;
mdd.lustre-MDT0000.append_stripe_count=1&lt;br/&gt;
mdd.lustre-MDT0002.append_stripe_count=1&lt;br/&gt;
mdd.lustre-MDT0001.append_stripe_count=1&lt;br/&gt;
mdd.lustre-MDT0003.append_stripe_count=1&lt;br/&gt;
CMD: trevis-129vm4,trevis-129vm5 /usr/sbin/lctl set_param mdd.*.append_pool=none&lt;br/&gt;
mdd.lustre-MDT0000.append_pool=none&lt;br/&gt;
mdd.lustre-MDT0002.append_pool=none&lt;br/&gt;
mdd.lustre-MDT0001.append_pool=none&lt;br/&gt;
mdd.lustre-MDT0003.append_pool=none&lt;/p&gt;
</description>
                <environment></environment>
        <key id="76412">LU-16872</key>
            <summary>sanity: test_27M Error: &apos;(5) stripe count , should be 8 for append&apos;</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="bertschinger">Thomas Bertschinger</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                    </labels>
                <created>Mon, 5 Jun 2023 17:19:26 +0000</created>
                <updated>Tue, 16 Jan 2024 21:34:00 +0000</updated>
                            <resolved>Sat, 19 Aug 2023 12:05:24 +0000</resolved>
                                                    <fixVersion>Lustre 2.16.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>7</watches>
                                                                            <comments>
                            <comment id="375977" author="JIRAUSER18444" created="Tue, 20 Jun 2023 15:08:44 +0000"  >&lt;p&gt;Andreas - I&apos;m away on vacation through June 25 so if this bug needs a quick resolution, you may want to have someone else look into it. Otherwise I&apos;ll continue to work on this when I get back next week.&lt;/p&gt;</comment>
                            <comment id="376856" author="arshad512" created="Thu, 29 Jun 2023 03:41:05 +0000"  >&lt;p&gt;+1 on master (&lt;a href=&quot;https://testing.whamcloud.com/sub_tests/399cef35-a321-43da-944a-84f8ce67c9f1&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/sub_tests/399cef35-a321-43da-944a-84f8ce67c9f1&lt;/a&gt;)&lt;/p&gt;</comment>
                            <comment id="376908" author="JIRAUSER18444" created="Thu, 29 Jun 2023 14:50:04 +0000"  >&lt;p&gt;Here&apos;s a status update since the bug is still causing failures. I&apos;m still looking at this and have not found the root cause yet, but I have a hypothesis.&lt;/p&gt;

&lt;p&gt;The origin of the &lt;tt&gt;EINVAL&lt;/tt&gt; response to the &lt;tt&gt;open()&lt;/tt&gt; call is &lt;tt&gt;lod_alloc_ost_list()&lt;/tt&gt;. From the debug logs, it seems it must be one of these:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
  &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (!test_bit(ost_idx, m-&amp;gt;lod_ost_bitmap)) {
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; rc = -EINVAL;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;break&lt;/span&gt;;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; }
...
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (lod_qos_is_tgt_used(env, ost_idx, stripe_count) &amp;amp;&amp;amp;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; !(lod_comp-&amp;gt;llc_pattern &amp;amp; LOV_PATTERN_OVERSTRIPING)) {
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; rc = -EINVAL;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &lt;span class=&quot;code-keyword&quot;&gt;break&lt;/span&gt;;
&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; } &lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;However, I am fairly confident that &lt;tt&gt;lod_alloc_ost_list()&lt;/tt&gt; should NOT be getting called in the append case at all, because this function appears to be for files with specifically set stripes, e.g., it gets called if a file inherits custom striping from its parent directory.&lt;/p&gt;

&lt;p&gt;Therefore, I believe the actual problem is that &lt;tt&gt;lod_comp-&amp;gt;llc_ostlist.op_array&lt;/tt&gt; and &lt;tt&gt;lod_comp-&amp;gt;llc_ostlist.op_count&lt;/tt&gt; are incorrectly non-zero when the failure occurs. My current hypothesis for the cause is this: the &lt;tt&gt;struct lu_tgt_pool&lt;/tt&gt; inside &lt;tt&gt;struct lod_layout_component&lt;/tt&gt; (where the op_array and op_count fields are) is preceded by &lt;tt&gt;char *llc_pool&lt;/tt&gt; so it&apos;s possible that &lt;tt&gt;char *&lt;/tt&gt; is being overflowed and putting garbage values into the array and count fields. So currently I&apos;m looking at where &lt;tt&gt;llc_pool&lt;/tt&gt; is set and if any of these spots could plausibly have an overflow.&lt;/p&gt;</comment>
                            <comment id="376966" author="JIRAUSER18444" created="Thu, 29 Jun 2023 18:51:47 +0000"  >&lt;p&gt;Oops, I wasn&apos;t thinking straight this morning but overflowing llc_pool wouldn&apos;t affect op_array and op_count since the buffer wouldn&apos;t be adjacent to these fields. So I&apos;m still looking for what could cause op_array and op_count to have bad values. (I still think that&apos;s the most likely explanation for the issue.)&lt;/p&gt;</comment>
                            <comment id="377354" author="gerrit" created="Tue, 4 Jul 2023 13:56:23 +0000"  >&lt;p&gt;&quot;Thomas Bertschinger &amp;lt;bertschinger@lanl.gov&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51559&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51559&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16872&quot; title=&quot;sanity: test_27M Error: &amp;#39;(5) stripe count , should be 8 for append&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16872&quot;&gt;&lt;del&gt;LU-16872&lt;/del&gt;&lt;/a&gt; lod: do not stripe O_APPEND files on specific OSTs&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 81e2439da705dd35dc2c8c687be21cf7dc952eba&lt;/p&gt;</comment>
                            <comment id="377355" author="JIRAUSER18444" created="Tue, 4 Jul 2023 14:08:33 +0000"  >&lt;p&gt;How to reproduce:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-bash&quot;&gt;
&lt;span class=&quot;code-comment&quot;&gt;# setup:
&lt;/span&gt;$ lctl set_param mdd.*.append_stripe_count=-1
$ lfs setstripe -o 1,3 /mnt/lustre

&lt;span class=&quot;code-comment&quot;&gt;# touch enough files with the default striping so that every mdt kernel thread probably has the defaults stored &lt;span class=&quot;code-object&quot;&gt;in&lt;/span&gt; its memory
&lt;/span&gt;$ &lt;span class=&quot;code-object&quot;&gt;for&lt;/span&gt; i &lt;span class=&quot;code-object&quot;&gt;in&lt;/span&gt; {0..100}; &lt;span class=&quot;code-object&quot;&gt;do&lt;/span&gt; touch /mnt/lustre/x&lt;span class=&quot;code-object&quot;&gt;$i&lt;/span&gt;; &lt;span class=&quot;code-object&quot;&gt;done&lt;/span&gt;

&lt;span class=&quot;code-comment&quot;&gt;# now an append should return EINVAL as long as it gets handled by a kernel thread that previously did a create with default stripes
&lt;/span&gt;$ echo 1 &amp;gt;&amp;gt; /mnt/lustre/f
-bash: /mnt/lustre/f: Invalid argument&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;A closely related problem occurs when an append_pool is set: in this case the create succeeds, but the appended-to file is created with the default stripes rather than with stripes from the pool.&lt;/p&gt;

&lt;p&gt;I haven&apos;t identified which patch caused (or uncovered) the issue yet &#8211; I didn&apos;t see anything obvious in the patches merged shortly before the first test failure occurred. So I&apos;ll attempt a git bisect to try to find what caused this and will update if I get that answer.&lt;/p&gt;</comment>
                            <comment id="377964" author="gerrit" created="Fri, 7 Jul 2023 20:05:13 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51602&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51602&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16872&quot; title=&quot;sanity: test_27M Error: &amp;#39;(5) stripe count , should be 8 for append&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16872&quot;&gt;&lt;del&gt;LU-16872&lt;/del&gt;&lt;/a&gt; tests: exercise sanity test_27M more fully&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 221a2d05d5d4ec2b39c88c6a5d84df2ba3f177dc&lt;/p&gt;</comment>
                            <comment id="383040" author="gerrit" created="Sat, 19 Aug 2023 05:33:38 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51559/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51559/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16872&quot; title=&quot;sanity: test_27M Error: &amp;#39;(5) stripe count , should be 8 for append&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16872&quot;&gt;&lt;del&gt;LU-16872&lt;/del&gt;&lt;/a&gt; lod: reset llc_ostlist when using O_APPEND stripes&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 766b35a9700f36aa08b652fa9d18b890d34bf4a5&lt;/p&gt;</comment>
                            <comment id="383041" author="gerrit" created="Sat, 19 Aug 2023 05:33:55 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51602/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51602/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-16872&quot; title=&quot;sanity: test_27M Error: &amp;#39;(5) stripe count , should be 8 for append&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-16872&quot;&gt;&lt;del&gt;LU-16872&lt;/del&gt;&lt;/a&gt; tests: exercise sanity test_27M more fully&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 7bb1685048bf999df03ceadab39faa09b8a5560d&lt;/p&gt;</comment>
                            <comment id="383065" author="pjones" created="Sat, 19 Aug 2023 12:05:24 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="71157">LU-16014</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="72280">LU-16147</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="75107">LU-16648</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="53114">LU-11279</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="69596">LU-15727</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="75107">LU-16648</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i03n6f:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>