<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 03:09:12 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-14377] parallel-scale test rr_alloc fails with &apos;&apos;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&apos;&apos;</title>
                <link>https://jira.whamcloud.com/browse/LU-14377</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;parallel-scale test_rr_alloc fails with &apos;&apos;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&apos;&apos;. It looks like this test has been failing since at least 22 NOV 2019 with&lt;br/&gt;
Lustre 2.12.3.31 - &lt;a href=&quot;https://testing.whamcloud.com/test_sets/b8fa5b22-0d76-11ea-98f1-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/b8fa5b22-0d76-11ea-98f1-52540065bddc&lt;/a&gt;&lt;br/&gt;
Lustre 2.13.51.72 - &lt;a href=&quot;https://testing.whamcloud.com/test_sets/32e5a306-44f4-11ea-8072-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/32e5a306-44f4-11ea-8072-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Since 2020-06-11, this test has been failing occasionally.&lt;/p&gt;

&lt;p&gt;Looking at the test_suite log for the failure at &lt;a href=&quot;https://testing.whamcloud.com/test_sets/875e0375-cc23-4f0f-8291-f4f9034e340c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/875e0375-cc23-4f0f-8291-f4f9034e340c&lt;/a&gt;, we see &lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;+ su mpiuser sh -c &quot;/usr/lib64/openmpi/bin/mpirun --mca btl tcp,self --mca btl_tcp_if_include eth0 -mca boot ssh --oversubscribe -np 22 /usr/lib64/openmpi/bin/rr_alloc /tmp/rr_alloc_mntpt/lustre/drr_alloc.parallel-scale/ash 555 2 &quot;
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n lod.lustre-MDT0000-mdtlov.qos_threshold_rr=17%
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0000-osc-MDT0000.create_count=1024
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0001-osc-MDT0000.create_count=1024
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0002-osc-MDT0000.create_count=1024
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0003-osc-MDT0000.create_count=2048
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0004-osc-MDT0000.create_count=2048
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0005-osc-MDT0000.create_count=2048
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0006-osc-MDT0000.create_count=1024
CMD: trevis-63vm4 /usr/sbin/lctl set_param -n osp.lustre-OST0007-osc-MDT0000.create_count=2048
 parallel-scale test_rr_alloc: @@@@@@ FAIL: Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2 
  Trace dump:
  = /usr/lib64/lustre/tests/test-framework.sh:6273:error()
  = /usr/lib64/lustre/tests/functions.sh:1120:run_rr_alloc()
  = /usr/lib64/lustre/tests/parallel-scale.sh:163:test_rr_alloc()
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;which, except for the error message, is the same command and values for create_count seen when this test passes. &lt;/p&gt;

&lt;p&gt;From functions.sh/run_rr_alloc(), here is how we compute the difference in the number of stripes created per OST:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
1095         &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; [[ $total_MNTPTS -ne 0 ]]; then
1096                 # Now start the actual file creation app.
1097                 mpi_run &lt;span class=&quot;code-quote&quot;&gt;&quot;-np $total_MNTPTS&quot;&lt;/span&gt; $cmd || &lt;span class=&quot;code-keyword&quot;&gt;return&lt;/span&gt;
1098         &lt;span class=&quot;code-keyword&quot;&gt;else&lt;/span&gt;
1099                 error &lt;span class=&quot;code-quote&quot;&gt;&quot;No mount point&quot;&lt;/span&gt;
1100         fi
1101 
1102         restore_lustre_params &amp;lt; $qos_prec_objs
1103         rm -f $qos_prec_objs
1104 
1105         diff_max_min_arr=($($LFS getstripe -r $DIR/$tdir/ |
1106                 grep &lt;span class=&quot;code-quote&quot;&gt;&quot;lmm_stripe_offset:&quot;&lt;/span&gt; | awk &lt;span class=&quot;code-quote&quot;&gt;&apos;{print $2}&apos;&lt;/span&gt; | sort -n |
1107                 uniq -c | awk &apos;NR==1 {min=max=$1} \
1108                 { $1&amp;lt;min ? min=$1 : min; $1&amp;gt;max ? max=$1 : max} \
1109                 END {print max-min, max, min}&apos;))
1110 
1111         rm -rf $DIR/$tdir
1112 
1113         # In-&lt;span class=&quot;code-keyword&quot;&gt;case&lt;/span&gt; of fairly large number of file creation using RR (round-robin)
1114         # there can be two cases in which deviation will occur than the regular
1115         # RR algo behaviour-
1116         # 1- When rr_alloc does not start right with &lt;span class=&quot;code-quote&quot;&gt;&apos;lqr_start_count&apos;&lt;/span&gt; reseeded,
1117         # 2- When rr_alloc does not finish with &lt;span class=&quot;code-quote&quot;&gt;&apos;lqr_start_count == 0&apos;&lt;/span&gt;.
1118         # So the difference of files b/w any 2 OST should not be more than 2.
1119         [[ ${diff_max_min_arr[0]} -le 2 ]] ||
1120                 error &lt;span class=&quot;code-quote&quot;&gt;&quot;Uneven distribution detected: difference between&quot;&lt;/span&gt; \
1121                 &lt;span class=&quot;code-quote&quot;&gt;&quot;maximum files per OST (${diff_max_min_arr[1]}) and&quot;&lt;/span&gt; \
1122                 &lt;span class=&quot;code-quote&quot;&gt;&quot;minimum files per OST (${diff_max_min_arr[2]}) must not be&quot;&lt;/span&gt; \
1123                 &lt;span class=&quot;code-quote&quot;&gt;&quot;greater than 2&quot;&lt;/span&gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>ZFS</environment>
        <key id="62543">LU-14377</key>
            <summary>parallel-scale test rr_alloc fails with &apos;&apos;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&apos;&apos;</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="adilger">Andreas Dilger</assignee>
                                    <reporter username="jamesanunez">James Nunez</reporter>
                        <labels>
                    </labels>
                <created>Thu, 28 Jan 2021 03:29:39 +0000</created>
                <updated>Fri, 3 Nov 2023 00:33:45 +0000</updated>
                            <resolved>Fri, 3 Nov 2023 00:33:45 +0000</resolved>
                                    <version>Lustre 2.14.0</version>
                    <version>Lustre 2.12.4</version>
                    <version>Lustre 2.15.1</version>
                    <version>Lustre 2.15.3</version>
                                    <fixVersion>Lustre 2.16.0</fixVersion>
                    <fixVersion>Lustre 2.15.4</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="334986" author="nangelinas" created="Mon, 16 May 2022 17:55:17 +0000"  >&lt;p&gt;+1 on master: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/d09310fb-2944-46a6-84e3-67634a12f39d&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/d09310fb-2944-46a6-84e3-67634a12f39d&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="341916" author="sarah" created="Thu, 28 Jul 2022 18:04:27 +0000"  >&lt;p&gt;+1 in 2.15.1 &lt;a href=&quot;https://testing.whamcloud.com/test_sets/59410f79-0bed-4fd3-97fc-e80941e5a00c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/59410f79-0bed-4fd3-97fc-e80941e5a00c&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="350079" author="gerrit" created="Wed, 19 Oct 2022 01:29:48 +0000"  >&lt;p&gt;&quot;Andreas Dilger &amp;lt;adilger@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/48914&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/48914&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14377&quot; title=&quot;parallel-scale test rr_alloc fails with &amp;#39;&amp;#39;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&amp;#39;&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14377&quot;&gt;&lt;del&gt;LU-14377&lt;/del&gt;&lt;/a&gt; tests: make parallel-scale/rr_alloc less strict&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: e5456735dbb92dbb438bef45cdf8cbfc55ce99cc&lt;/p&gt;</comment>
                            <comment id="352106" author="gerrit" created="Tue, 8 Nov 2022 08:53:03 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/48914/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/48914/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14377&quot; title=&quot;parallel-scale test rr_alloc fails with &amp;#39;&amp;#39;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&amp;#39;&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14377&quot;&gt;&lt;del&gt;LU-14377&lt;/del&gt;&lt;/a&gt; tests: make parallel-scale/rr_alloc less strict&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: b104c0a27713899a4d047f56fed57c30c39b8195&lt;/p&gt;</comment>
                            <comment id="352146" author="pjones" created="Tue, 8 Nov 2022 13:57:42 +0000"  >&lt;p&gt;Landed for 2.16&lt;/p&gt;</comment>
                            <comment id="373487" author="gerrit" created="Thu, 25 May 2023 16:55:35 +0000"  >&lt;p&gt;&quot;Minh Diep &amp;lt;mdiep@whamcloud.com&amp;gt;&quot; uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51142&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51142&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14377&quot; title=&quot;parallel-scale test rr_alloc fails with &amp;#39;&amp;#39;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&amp;#39;&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14377&quot;&gt;&lt;del&gt;LU-14377&lt;/del&gt;&lt;/a&gt; tests: make parallel-scale/rr_alloc less strict&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 1194fd9de1d3853482a5c51574cd4ba91f1ce9ab&lt;/p&gt;</comment>
                            <comment id="381012" author="gerrit" created="Wed, 2 Aug 2023 06:16:06 +0000"  >&lt;p&gt;&quot;Oleg Drokin &amp;lt;green@whamcloud.com&amp;gt;&quot; merged in patch &lt;a href=&quot;https://review.whamcloud.com/c/fs/lustre-release/+/51142/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/c/fs/lustre-release/+/51142/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-14377&quot; title=&quot;parallel-scale test rr_alloc fails with &amp;#39;&amp;#39;Uneven distribution detected: difference between maximum files per OST (1528) and minimum files per OST (1525) must not be greater than 2&amp;#39;&amp;#39;&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-14377&quot;&gt;&lt;del&gt;LU-14377&lt;/del&gt;&lt;/a&gt; tests: make parallel-scale/rr_alloc less strict&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_15&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: c0b60c0c79a2d5d5be651570564d6d0407457a5f&lt;/p&gt;</comment>
                            <comment id="383984" author="adilger" created="Mon, 28 Aug 2023 19:17:09 +0000"  >&lt;p&gt;This is still failing regularly, often with very large differences between the most and least used OSTs (i.e. 90% difference instead of just 2-3% difference). So it seems that either the test as written is unreliable (creating too many objects, running on an already-imbalanced system, etc.), or there is a new bug in the code.&lt;/p&gt;</comment>
                            <comment id="391570" author="adilger" created="Fri, 3 Nov 2023 00:33:45 +0000"  >&lt;p&gt;Patches have already landed for this ticket; new ticket &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17251&quot; title=&quot;parallel-scale test_rr_alloc: max/min OST objects (2800 : 923) too different&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17251&quot;&gt;LU-17251&lt;/a&gt; is tracking new patches.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="47324">LU-9780</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="78724">LU-17251</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="12848">LU-977</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i01kjz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>