<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:58:55 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-13162] parallel-scale test_statahead: mdsrate invoked oom-killer</title>
                <link>https://jira.whamcloud.com/browse/LU-13162</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;This issue was created by maloo for jianyu &amp;lt;yujian@whamcloud.com&amp;gt;&lt;/p&gt;

&lt;p&gt;This issue relates to the following test suite run: &lt;a href=&quot;https://testing.whamcloud.com/test_sets/0925c456-3ba8-11ea-bb75-52540065bddc&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.whamcloud.com/test_sets/0925c456-3ba8-11ea-bb75-52540065bddc&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;test_statahead failed with the following error:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;+ su mpiuser sh -c &quot;/usr/lib64/openmpi/bin/mpirun --mca btl tcp,self --mca btl_tcp_if_include eth0 -mca boot ssh --oversubscribe -machinefile /tmp/auster.machines -np 64 /usr/lib64/openmpi/bin/mdsrate --mknod --dir /mnt/lustre/dstatahead --nfiles 160711 --filefmt &apos;f%%d&apos; &quot;
[1579521814.463727] [trevis-12vm6:7395 :0]            cpu.c:52   UCX  WARN  CPU does not support invariant TSC, time may be unstable
[1579522133.063761] [trevis-12vm7:26045:0]            cpu.c:52   UCX  WARN  CPU does not support invariant TSC, time may be unstable
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Clients crashed:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[69145.465824] Lustre: DEBUG MARKER: == parallel-scale test statahead: statahead test, multiple clients =================================== 12:03:31 (1579521811)
[69145.622411] Lustre: lustre-OST0000-osc-ffff9d88618a4800: reconnect after 7127s idle
[69166.377333] Lustre: lustre-OST0000-osc-ffff9d88618a4800: disconnect after 21s idle
[69173.846404] mdsrate invoked oom-killer: gfp_mask=0x6280ca(GFP_HIGHUSER_MOVABLE|__GFP_ZERO), nodemask=(null), order=0, oom_score_adj=0
[69173.848578] mdsrate cpuset=/ mems_allowed=0
[69173.849368] CPU: 1 PID: 7399 Comm: mdsrate Kdump: loaded Tainted: G           OE    --------- -  - 4.18.0-147.3.1.el8_1.x86_64 #1
[69173.851539] Hardware name: Red Hat KVM, BIOS 0.5.1 01/01/2011
[69173.852562] Call Trace:
[69173.853154]  dump_stack+0x5c/0x80
[69173.853821]  dump_header+0x6e/0x27a
[69173.854515]  ? notifier_call_chain+0x47/0x70
[69173.855409]  out_of_memory.cold.32+0xa/0x80
[69173.856169]  __alloc_pages_slowpath+0xc0f/0xce0
[69173.856982]  __alloc_pages_nodemask+0x245/0x280
[69173.857837]  alloc_pages_vma+0x74/0x1d0
[69173.858574]  do_anonymous_page+0x90/0x370
[69173.859325]  __handle_mm_fault+0x66e/0x6b0
[69173.860069]  handle_mm_fault+0xda/0x200
[69173.860764]  __get_user_pages+0x255/0x7c0
[69173.861541]  ? _cond_resched+0x15/0x30
[69173.862230]  get_user_pages+0x3e/0x50
[69173.862898]  get_user_pages_longterm+0x34/0x190
[69173.863772]  ib_umem_get+0x2ee/0x520 [ib_core]
[69173.864602]  mlx4_ib_reg_user_mr+0x71/0x1e0 [mlx4_ib]
[69173.865519]  ib_uverbs_reg_mr+0x143/0x240 [ib_uverbs]
[69173.866428]  ? __blk_mq_run_hw_queue+0x51/0xd0
[69173.867218]  ib_uverbs_handler_UVERBS_METHOD_INVOKE_WRITE+0xb1/0xf0 [ib_uverbs]
[69173.868475]  ib_uverbs_run_method+0x20c/0x7a0 [ib_uverbs]
[69173.869438]  ? __switch_to_asm+0x35/0x70
[69173.870146]  ? uverbs_disassociate_api+0x100/0x100 [ib_uverbs]
[69173.871155]  ? __switch_to_asm+0x41/0x70
[69173.871858]  ? __switch_to_asm+0x35/0x70
[69173.872566]  ib_uverbs_cmd_verbs+0x189/0x380 [ib_uverbs]
[69173.873490]  ? __switch_to_asm+0x41/0x70
[69173.874196]  ? __switch_to_asm+0x35/0x70
[69173.874898]  ? __switch_to_asm+0x41/0x70
[69173.875600]  ? __switch_to_asm+0x35/0x70
[69173.876315]  ? __switch_to+0x115/0x480
[69173.876999]  ? finish_task_switch+0x76/0x2b0
[69173.877765]  ? free_swap_slot+0x9a/0xf0
[69173.878446]  ? wp_page_reuse+0x4d/0x60
[69173.879128]  ? __raw_spin_unlock+0x5/0x10
[69173.879844]  ? do_wp_page+0x217/0x310
[69173.880501]  ? __handle_mm_fault+0x67e/0x6b0
[69173.881267]  ib_uverbs_ioctl+0xa3/0x100 [ib_uverbs]
[69173.882139]  do_vfs_ioctl+0xa4/0x630
[69173.882806]  ? __x64_sys_madvise+0x4a6/0x790
[69173.883573]  ? syscall_trace_enter+0x1d3/0x2c0
[69173.884356]  ksys_ioctl+0x60/0x90
[69173.884963]  __x64_sys_ioctl+0x16/0x20
[69173.885640]  do_syscall_64+0x5b/0x1b0
[69173.886311]  entry_SYSCALL_64_after_hwframe+0x65/0xca
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;





&lt;p&gt;VVVVVVV DO NOT REMOVE LINES BELOW, Added by Maloo for auto-association VVVVVVV&lt;br/&gt;
parallel-scale test_statahead - trevis-12vm6, trevis-12vm7 crashed during parallel-scale test_statahead&lt;/p&gt;</description>
                <environment>RHEL 8.1 client + RHEL 7.7 server</environment>
        <key id="57845">LU-13162</key>
            <summary>parallel-scale test_statahead: mdsrate invoked oom-killer</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="ys">Yang Sheng</assignee>
                                    <reporter username="maloo">Maloo</reporter>
                        <labels>
                            <label>rhel8</label>
                    </labels>
                <created>Tue, 21 Jan 2020 08:07:03 +0000</created>
                <updated>Tue, 23 Feb 2021 17:05:49 +0000</updated>
                            <resolved>Wed, 17 Feb 2021 22:23:53 +0000</resolved>
                                    <version>Lustre 2.13.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="261587" author="pjones" created="Tue, 21 Jan 2020 18:47:14 +0000"  >&lt;p&gt;Yang Sheng&lt;/p&gt;

&lt;p&gt;Could you please investigate?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="262483" author="ys" created="Mon, 3 Feb 2020 21:37:50 +0000"  >&lt;p&gt;Hi, Yujian,&lt;/p&gt;

&lt;p&gt;Do you know whether &apos;panic_on_oom is enabled&apos; is set by default in RHEL 8.1, or whether we set it intentionally on our test system?&lt;/p&gt;

&lt;p&gt;Thanks,&lt;br/&gt;
YangSheng&lt;/p&gt;</comment>
                            <comment id="263071" author="ys" created="Tue, 11 Feb 2020 14:24:35 +0000"  >&lt;p&gt;Duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11424&quot; title=&quot;incorrect amount of cpts copied to lnet_cpts&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11424&quot;&gt;&lt;del&gt;LU-11424&lt;/del&gt;&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="57093">LU-12830</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i00san:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>