<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:46:07 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary, append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-11693] Soft lockups on Lustre clients</title>
                <link>https://jira.whamcloud.com/browse/LU-11693</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;We get quite a few soft lockups on our Lustre gateways (Lustre clients that export Lustre filesystems over NFS). Example:&lt;/p&gt;

&lt;p&gt;Nov 13 00:26:06 foxtrot2 kernel: NMI watchdog: BUG: soft lockup - CPU#0 stuck for 23s! &lt;span class=&quot;error&quot;&gt;&amp;#91;nfsd:11973&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: NMI watchdog: BUG: soft lockup - CPU#1 stuck for 23s! &lt;span class=&quot;error&quot;&gt;&amp;#91;rsync:36079&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: Modules linked in: vfat fat dm_service_time mpt3sas mpt2sas raid_class scsi_transport_sas mptctl mptbase nfsv3 nfs fscache osc(OE) mgc(OE) lustre(OE) lmv(OE) mdc(OE) lov(OE) fid(OE) fld(OE) ksocklnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) dell_rbu libcfs(OE) bonding sb_edac edac_core intel_powerclamp coretemp intel_rapl iosf_mbi kvm_intel iTCO_wdt iTCO_vendor_support kvm joydev dcdbas irqbypass sg shpchp ipmi_si ipmi_devintf ipmi_msghandler lpc_ich mei_me mei acpi_power_meter acpi_pad nfsd auth_rpcgss nfs_acl lockd grace binfmt_misc ip_tables xfs sd_mod crc_t10dif crct10dif_generic 8021q garp stp llc mrp mgag200 i2c_algo_bit drm_kms_helper scsi_transport_iscsi bnx2x syscopyarea sysfillrect sysimgblt fb_sys_fops ttm crct10dif_pclmul crct10dif_common crc32_pclmul crc32c_intel ahci drm ghash_clmulni_intel&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: libahci aesni_intel dm_multipath libata lrw gf128mul glue_helper ablk_helper cryptd megaraid_sas i2c_core ptp pps_core mdio libcrc32c wmi sunrpc dm_mirror dm_region_hash dm_log dm_mod &lt;span class=&quot;error&quot;&gt;&amp;#91;last unloaded: usb_storage&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: CPU: 1 PID: 36079 Comm: rsync Tainted: G W OE ------------ 3.10.0-693.5.2.el7_lustre.x86_64 #1&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: Hardware name: Dell Inc. PowerEdge R620/01W23F, BIOS 2.5.4 01/22/2016&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: task: ffff883ff8a04f10 ti: ffff8815a1200000 task.ti: ffff8815a1200000&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: RIP: 0010:&lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810fa332&amp;gt;&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810fa332&amp;gt;&amp;#93;&lt;/span&gt; native_queued_spin_lock_slowpath+0x112/0x1e0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: RSP: 0018:ffff8815a1203700 EFLAGS: 00000246&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: RAX: 0000000000000000 RBX: ffff883fff017880 RCX: 0000000000090000&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: RDX: ffff883fff4d7880 RSI: 0000000001390101 RDI: ffff881ff99da818&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: RBP: ffff8815a1203700 R08: ffff883fff017880 R09: 0000000000000000&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: R10: 0004c5dab524ba0b R11: 0000000000000000 R12: 0004c5dab524ba0b&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: R13: 0000000000000000 R14: 0004c5dab39dc857 R15: ffff8815a12036e8&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: FS: 00007f0ff1094740(0000) GS:ffff883fff000000(0000) knlGS:0000000000000000&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: CS: 0010 DS: 0000 ES: 0000 CR0: 0000000080050033&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: CR2: 00007fd6cb1e9000 CR3: 000000163eff9000 CR4: 00000000001407e0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: Stack:&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: ffff8815a1203710 ffffffff8169e6bf ffff8815a1203720 ffffffff816abbf0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: ffff8815a12037a0 ffffffffc0c2d421 ffff8815a12037e0 ffffffffc0c2ba60&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: 0000000000000000 00000161000ab602 0004c5dab524ba0b ffff88130fb65c00&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: Call Trace:&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8169e6bf&amp;gt;&amp;#93;&lt;/span&gt; queued_spin_lock_slowpath+0xb/0xf&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff816abbf0&amp;gt;&amp;#93;&lt;/span&gt; _raw_spin_lock+0x20/0x30&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c2d421&amp;gt;&amp;#93;&lt;/span&gt; ldlm_prepare_lru_list+0x361/0x4e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c2ba60&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cancel_aged_no_wait_policy+0x70/0x70 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c30c5a&amp;gt;&amp;#93;&lt;/span&gt; ldlm_cancel_lru_local+0x1a/0x30 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c30e8e&amp;gt;&amp;#93;&lt;/span&gt; ldlm_prep_elc_req+0x21e/0x490 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c31128&amp;gt;&amp;#93;&lt;/span&gt; ldlm_prep_enqueue_req+0x28/0x30 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc07c67a3&amp;gt;&amp;#93;&lt;/span&gt; mdc_intent_getattr_pack.isra.15+0x93/0x280 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc07c8f3b&amp;gt;&amp;#93;&lt;/span&gt; mdc_enqueue_base+0x9fb/0x18f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810c45a3&amp;gt;&amp;#93;&lt;/span&gt; ? try_to_wake_up+0x183/0x340&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810ba598&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up_common+0x58/0x90&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc07ca6cb&amp;gt;&amp;#93;&lt;/span&gt; mdc_intent_lock+0x26b/0x520 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c66243&amp;gt;&amp;#93;&lt;/span&gt; ? reply_in_callback+0x143/0x5e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0972e30&amp;gt;&amp;#93;&lt;/span&gt; ? ll_invalidate_negative_children+0x1d0/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0c2c7a0&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_expired_completion_wait+0x240/0x240 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0910e4f&amp;gt;&amp;#93;&lt;/span&gt; lmv_intent_lock+0x5cf/0x1b50 &lt;span class=&quot;error&quot;&gt;&amp;#91;lmv&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810b8a01&amp;gt;&amp;#93;&lt;/span&gt; ? in_group_p+0x31/0x40&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc09738c5&amp;gt;&amp;#93;&lt;/span&gt; ? ll_i2suppgid+0x15/0x40 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0973914&amp;gt;&amp;#93;&lt;/span&gt; ? ll_i2gids+0x24/0xb0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81114b02&amp;gt;&amp;#93;&lt;/span&gt; ? from_kgid+0x12/0x20&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0972e30&amp;gt;&amp;#93;&lt;/span&gt; ? ll_invalidate_negative_children+0x1d0/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0974feb&amp;gt;&amp;#93;&lt;/span&gt; ll_lookup_it+0x29b/0xee0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810c8f28&amp;gt;&amp;#93;&lt;/span&gt; ? __enqueue_entity+0x78/0x80&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffc0976fbb&amp;gt;&amp;#93;&lt;/span&gt; ll_lookup_nd+0xbb/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8120b3dd&amp;gt;&amp;#93;&lt;/span&gt; lookup_real+0x1d/0x50&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8120bcb2&amp;gt;&amp;#93;&lt;/span&gt; __lookup_hash+0x42/0x60&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff816a13e2&amp;gt;&amp;#93;&lt;/span&gt; lookup_slow+0x42/0xa7&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8120f25b&amp;gt;&amp;#93;&lt;/span&gt; path_lookupat+0x77b/0x7b0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811df623&amp;gt;&amp;#93;&lt;/span&gt; ? kmem_cache_alloc+0x193/0x1e0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81211c9f&amp;gt;&amp;#93;&lt;/span&gt; ? getname_flags+0x4f/0x1a0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8120f2bb&amp;gt;&amp;#93;&lt;/span&gt; filename_lookup+0x2b/0xc0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81212e37&amp;gt;&amp;#93;&lt;/span&gt; user_path_at_empty+0x67/0xc0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81212ea1&amp;gt;&amp;#93;&lt;/span&gt; user_path_at+0x11/0x20&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff812063e3&amp;gt;&amp;#93;&lt;/span&gt; vfs_fstatat+0x63/0xc0&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff812069b1&amp;gt;&amp;#93;&lt;/span&gt; SYSC_newlstat+0x31/0x60&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81206c3e&amp;gt;&amp;#93;&lt;/span&gt; SyS_newlstat+0xe/0x10&lt;br/&gt;
Nov 13 00:26:06 foxtrot2 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff816b5089&amp;gt;&amp;#93;&lt;/span&gt; system_call_fastpath+0x16/0x1b&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</description>
                <environment></environment>
        <key id="54092">LU-11693</key>
            <summary>Soft lockups on Lustre clients</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="1" iconUrl="https://jira.whamcloud.com/images/icons/statuses/open.png" description="The issue is open and ready for the assignee to start work on it.">Open</status>
                    <statusCategory id="2" key="new" colorName="default"/>
                                    <resolution id="-1">Unresolved</resolution>
                                        <assignee username="yujian">Jian Yu</assignee>
                                    <reporter username="cmcl">Campbell Mcleay</reporter>
                        <labels>
                    </labels>
                <created>Thu, 22 Nov 2018 14:59:50 +0000</created>
                <updated>Thu, 28 Feb 2019 10:44:32 +0000</updated>
                                            <version>Lustre 2.10.2</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="237390" author="cmcl" created="Thu, 22 Nov 2018 15:08:28 +0000"  >&lt;p&gt;Versions are:&lt;/p&gt;

&lt;p&gt;lustre-2.10.2-1.el7&lt;/p&gt;

&lt;p&gt;kernel-3.10.0-693.5.2.el7_lustre&lt;/p&gt;</comment>
                            <comment id="237392" author="adilger" created="Thu, 22 Nov 2018 17:30:04 +0000"  >&lt;p&gt;This looks like a duplicate of a previously-reported issue.  Please try:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;# lctl set_param ldlm.namespaces.*.lru_size=10000
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;On these clients to see if this avoids the issue?&lt;/p&gt;</comment>
                            <comment id="237393" author="cmcl" created="Thu, 22 Nov 2018 17:49:44 +0000"  >&lt;p&gt;Hi Andreas,&lt;/p&gt;

&lt;p&gt;I think we set this already, when I run:&lt;/p&gt;

&lt;p&gt;lctl get_param &apos;ldlm.namespaces.*.lru_size&apos;&lt;/p&gt;

&lt;p&gt;I get:&lt;/p&gt;

&lt;p&gt;ldlm.namespaces.MGC10.21.22.10@tcp.lru_size=10000&lt;/p&gt;

&lt;p&gt;where&#160;10.21.22.10 is our MDS&lt;/p&gt;

&lt;p&gt;Thanks,&lt;/p&gt;

&lt;p&gt;Campbell&lt;/p&gt;</comment>
                            <comment id="237394" author="cmcl" created="Thu, 22 Nov 2018 17:55:14 +0000"  >&lt;p&gt;I should mention it prints out a list of values for all the OSTs and the MDT which are larger than this value, e.g.,&#160;&lt;/p&gt;

&lt;p&gt;ldlm.namespaces.foxtrot-MDT0000-mdc-ffff883ff9b89000.lru_size=246531&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0000-osc-ffff883ff9b89000.lru_size=17716&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0001-osc-ffff883ff9b89000.lru_size=17472&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0002-osc-ffff883ff9b89000.lru_size=17561&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0003-osc-ffff883ff9b89000.lru_size=17628&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0004-osc-ffff883ff9b89000.lru_size=17492&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0005-osc-ffff883ff9b89000.lru_size=17555&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0006-osc-ffff883ff9b89000.lru_size=17334&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0007-osc-ffff883ff9b89000.lru_size=17511&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0008-osc-ffff883ff9b89000.lru_size=17534&lt;br/&gt;
ldlm.namespaces.foxtrot-OST0009-osc-ffff883ff9b89000.lru_size=17689&lt;br/&gt;
ldlm.namespaces.foxtrot-OST000a-osc-ffff883ff9b89000.lru_size=17609&lt;br/&gt;
ldlm.namespaces.foxtrot-OST000b-osc-ffff883ff9b89000.lru_size=17144&lt;br/&gt;
ldlm.namespaces.foxtrot-OST000c-osc-ffff883ff9b89000.lru_size=17438&lt;/p&gt;

&lt;p&gt;etc&lt;/p&gt;

&lt;p&gt;in case that is important&lt;/p&gt;</comment>
                            <comment id="237397" author="adilger" created="Thu, 22 Nov 2018 22:13:29 +0000"  >&lt;p&gt;The patch &lt;a href=&quot;https://review.whamcloud.com/33130&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33130&lt;/a&gt; &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9230&quot; title=&quot;soft lockup on v2.9 Lustre clients (ldlm?)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9230&quot;&gt;&lt;del&gt;LU-9230&lt;/del&gt;&lt;/a&gt; ldlm: speed up preparation for list of lock cancel&quot; should resolve the CPU contention in &lt;tt&gt;ldlm_prepare_lru_list()&lt;/tt&gt; that you are seeing here.&lt;/p&gt;

&lt;p&gt;This patch has been landed to the master branch (for 2.12) for over 6 months and has seen a lot of testing already.  It is in the process of landing to the b2_10 branch for the next 2.10.x release, so there is not yet a release package available with this patch included.  It is a client-only patch, so could be installed on the affected nodes without taking down the whole system.&lt;/p&gt;</comment>
                            <comment id="238000" author="cmcl" created="Wed, 5 Dec 2018 15:21:39 +0000"  >&lt;p&gt;Thanks Andreas. I was looking for a compatibility matrix to see whether 2.12 on the client is compatible with 2.10 on the server. Is there something available online that shows compatibility of releases?&#160;&lt;/p&gt;

&lt;p&gt;regards,&lt;/p&gt;

&lt;p&gt;Campbell&lt;/p&gt;</comment>
                            <comment id="238001" author="cmcl" created="Wed, 5 Dec 2018 15:23:26 +0000"  >&lt;p&gt;Actually, I see that 2.12 is not listed as supported by Whamcloud. I&apos;ll patch it then.&lt;/p&gt;</comment>
                            <comment id="238002" author="pjones" created="Wed, 5 Dec 2018 15:30:02 +0000"  >&lt;p&gt;Campbell&lt;/p&gt;

&lt;p&gt;2.12 is very close to release - we tagged the first RC yesterday. So, upon GA, another option to patching will be to use a 2.12 client as this interoperates with 2.10.x servers ok.&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="238016" author="cmcl" created="Wed, 5 Dec 2018 18:40:29 +0000"  >&lt;p&gt;Thanks Peter. I applied the patches for both the crashes and the lockups to 2.10.2-1 source and it fails to build. Can you tell me what I need to do here? Attached is the build log&#160;&lt;span class=&quot;nobr&quot;&gt;&lt;a href=&quot;https://jira.whamcloud.com/secure/attachment/31577/31577_build.log&quot; title=&quot;build.log attached to LU-11693&quot;&gt;build.log&lt;sup&gt;&lt;img class=&quot;rendericon&quot; src=&quot;https://jira.whamcloud.com/images/icons/link_attachment_7.gif&quot; height=&quot;7&quot; width=&quot;7&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/sup&gt;&lt;/a&gt;&lt;/span&gt;&lt;/p&gt;</comment>
                            <comment id="238017" author="pjones" created="Wed, 5 Dec 2018 18:43:52 +0000"  >&lt;p&gt;Jian&lt;/p&gt;

&lt;p&gt;Could you please assist Campbell in porting the fix for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9230&quot; title=&quot;soft lockup on v2.9 Lustre clients (ldlm?)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9230&quot;&gt;&lt;del&gt;LU-9230&lt;/del&gt;&lt;/a&gt; to 2.10.2?&lt;/p&gt;

&lt;p&gt;thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="238019" author="cmcl" created="Wed, 5 Dec 2018 18:48:44 +0000"  >&lt;p&gt;I&apos;m also happy to apply the patches to a later supported release if that is easier...&lt;/p&gt;</comment>
                            <comment id="238020" author="pjones" created="Wed, 5 Dec 2018 18:51:27 +0000"  >&lt;p&gt;Jian&lt;/p&gt;

&lt;p&gt;The port already exists to b2_10 - &lt;a href=&quot;https://review.whamcloud.com/#/c/33130/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/33130/&lt;/a&gt;&#160;- but does it need refreshing to apply to the tip of b2_10 or else to the 2.10.5 release?&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="238025" author="yujian" created="Wed, 5 Dec 2018 20:11:30 +0000"  >&lt;p&gt;Hi Peter,&lt;br/&gt;
I just checked that the patch can be applied cleanly to both the tip of b2_10 and 2.10.5 release.&lt;/p&gt;</comment>
                            <comment id="238036" author="yujian" created="Wed, 5 Dec 2018 21:29:26 +0000"  >&lt;p&gt;Hi Campbell,&lt;br/&gt;
Patch &lt;a href=&quot;https://review.whamcloud.com/33130&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33130&lt;/a&gt; is now on the tip of Lustre b2_10 branch. Please find the el7 builds in &lt;a href=&quot;https://build.whamcloud.com/job/lustre-reviews/60456/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-reviews/60456/&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="238086" author="cmcl" created="Thu, 6 Dec 2018 10:25:58 +0000"  >&lt;p&gt;Thanks Jian. I still have to add a patch for a kernel panic issue (&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11692&quot; title=&quot;lustre kernel panic -  (niobuf.c:330:ptlrpc_register_bulk()) LBUG&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11692&quot;&gt;&lt;del&gt;LU-11692&lt;/del&gt;&lt;/a&gt;), so might grab the src rpm for 2.10.5 and try to patch that.&lt;/p&gt;

&lt;p&gt;-Campbell&lt;/p&gt;</comment>
                            <comment id="238087" author="cmcl" created="Thu, 6 Dec 2018 10:48:17 +0000"  >&lt;p&gt;2.10.5 fails to build. Should I send the build log?&lt;/p&gt;</comment>
                            <comment id="238091" author="adilger" created="Thu, 6 Dec 2018 12:23:18 +0000"  >&lt;p&gt;Campbell, I&apos;m not sure what build problem you are seeing (we build this branch daily), but I&apos;ve cherry-picked the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11692&quot; title=&quot;lustre kernel panic -  (niobuf.c:330:ptlrpc_register_bulk()) LBUG&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11692&quot;&gt;&lt;del&gt;LU-11692&lt;/del&gt;&lt;/a&gt; patch on top of 33130.  It looks like the builders are a bit backed up, but there should be a link to a build reported in &lt;a href=&quot;https://review.whamcloud.com/33798&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33798&lt;/a&gt; in a couple of hours.  Feel free to attach your build logs here, in case it is a trivial problem to fix.&lt;/p&gt;</comment>
                            <comment id="238093" author="cmcl" created="Thu, 6 Dec 2018 13:52:46 +0000"  >&lt;p&gt;Hi Andreas,&lt;/p&gt;

&lt;p&gt;I&apos;m doing something wrong here, I cloned git://git.whamcloud.com/fs/lustre-release.git and checked out the b2_10 branch, but the files are unpatched and I&apos;m not quite sure how to add that patch via git. I can&apos;t find it to cherry-pick it. Or can I just add the patches manually via diff and patch? I was doing it this way before but the build fails (whereas an unpatched tree compiles fine).&#160;Sorry for my ignorance here.&lt;/p&gt;

&lt;p&gt;regards,&lt;/p&gt;

&lt;p&gt;Campbell&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="238106" author="yujian" created="Thu, 6 Dec 2018 18:37:36 +0000"  >&lt;p&gt;Hi Campbell,&lt;br/&gt;
Build &lt;a href=&quot;https://build.whamcloud.com/job/lustre-reviews/60480/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://build.whamcloud.com/job/lustre-reviews/60480/&lt;/a&gt; in &lt;a href=&quot;https://review.whamcloud.com/33798&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33798&lt;/a&gt; is ready. It contains both the patches for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11693&quot; title=&quot;Soft lockups on Lustre clients&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11693&quot;&gt;LU-11693&lt;/a&gt;/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-9230&quot; title=&quot;soft lockup on v2.9 Lustre clients (ldlm?)&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-9230&quot;&gt;&lt;del&gt;LU-9230&lt;/del&gt;&lt;/a&gt; and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11692&quot; title=&quot;lustre kernel panic -  (niobuf.c:330:ptlrpc_register_bulk()) LBUG&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11692&quot;&gt;&lt;del&gt;LU-11692&lt;/del&gt;&lt;/a&gt;/&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11647&quot; title=&quot;niobuf.c:330:ptlrpc_register_bulk()) ASSERTION( desc-&amp;gt;bd_md_count == 0 ) failed:&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11647&quot;&gt;&lt;del&gt;LU-11647&lt;/del&gt;&lt;/a&gt; applied on the tip of Lustre b2_10 branch (tag 2.10.6-RC3).&lt;/p&gt;</comment>
                            <comment id="238141" author="adilger" created="Fri, 7 Dec 2018 01:16:42 +0000"  >&lt;p&gt;Campbell, what process are you using to build, and what files are &quot;unpatched&quot;?  I&apos;d recommend to follow e.g. &lt;a href=&quot;https://wiki.whamcloud.com/pages/viewpage.action?pageId=52104622&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://wiki.whamcloud.com/pages/viewpage.action?pageId=52104622&lt;/a&gt; or &lt;a href=&quot;http://wiki.lustre.org/Compiling_Lustre&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://wiki.lustre.org/Compiling_Lustre&lt;/a&gt; if you&apos;ve never done this before.  At its simplest, doing &quot;&lt;tt&gt;sh autogen.sh; ./configure; make rpms&lt;/tt&gt;&quot; is all that is needed, once you have the kernel source RPMs but it can become more complex if you are using OFED, ZFS, etc.&lt;/p&gt;

&lt;p&gt;As Jian wrote, it is a lot easier to use a pre-built package if that has the features you need.&lt;/p&gt;</comment>
                            <comment id="238154" author="cmcl" created="Fri, 7 Dec 2018 10:25:08 +0000"  >&lt;p&gt;Hi Andreas,&lt;/p&gt;

&lt;p&gt;I cloned the lustre repo and then checked out the b2_10 branch. I then ran an autogen, copied the spec file to my rpmbuild tree and tarred the source up and copied it to rpmbuild/SOURCES. I was expecting the b2_10 to already be patched but a comparison showed it hadn&apos;t been. I created a patch file from a recursive diff and then modified the spec file to apply that patch. I then built a source rpm and tried an rpm rebuild. I was getting build errors, e.g.,&#160;&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
 /u/cmcl/rpmbuild/BUILD/lustre-2.10.2/lustre/include/lustre_lib.h:357:9: error: implicit declaration of function &lt;span class=&quot;code-quote&quot;&gt;&apos;is_bl_done&apos;&lt;/span&gt; [-Werror=implicit-function-declaration]
 struct l_wait_info *__info = (info); \
 ^
/u/cmcl/rpmbuild/BUILD/lustre-2.10.2/lustre/ptlrpc/../../lustre/ldlm/ldlm_lock.c:2330:3: note: in expansion of macro &lt;span class=&quot;code-quote&quot;&gt;&apos;l_wait_event&apos;&lt;/span&gt;
 l_wait_event(lock-&amp;gt;l_waitq, is_bl_done(lock), &amp;amp;lwi)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I&apos;m doing something wrong and/or in an overly complicated way. I thought the b2_10 branch would have already been patched.&lt;br/&gt;
I&apos;d seen the whamcloud wiki page you&apos;d mentioned but thought that was for server rather than client. The wiki.lustre.org I hadn&apos;t seen.&lt;br/&gt;
Anyway, I found a build on &lt;a href=&quot;https://review.whamcloud.com/33798&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33798&lt;/a&gt; linked by Jian which has the patches in it, so I&apos;ll build from that. Sorry for wasting your time with this but hopefully I&apos;ll be on the right track from here on in.&lt;/p&gt;

&lt;p&gt;Cheers,&lt;/p&gt;

&lt;p&gt;Campbell&lt;/p&gt;</comment>
                            <comment id="238159" author="pjones" created="Fri, 7 Dec 2018 14:03:57 +0000"  >&lt;p&gt;Glad to hear that you&apos;ve got this sorted out. Let us know whether the fix works as expected.&lt;/p&gt;</comment>
                            <comment id="238166" author="cmcl" created="Fri, 7 Dec 2018 15:33:08 +0000"  >&lt;p&gt;I&apos;ve built the rpms fine but I have another question: the client has the lustre kernel package installed (I am told it was installed as the lustre kernel has better performance than a vanilla kernel), which provides the fs and net kernel modules. The kmod-lustre-client package provides the kernel modules, though it installs them in /lib/modules/`uname -r`/extra/lustre-client rather than /lib/modules/`uname -r`/extra/lustre. Will this cause any kind of issue if both are installed, or is it better to install e.g., a vanilla kernel and rebuild the packages against this?&lt;/p&gt;

&lt;p&gt;Thanks,&lt;/p&gt;

&lt;p&gt;Campbell&lt;/p&gt;</comment>
                            <comment id="238176" author="yujian" created="Fri, 7 Dec 2018 17:47:05 +0000"  >&lt;p&gt;Hi Campbell,&lt;br/&gt;
The Lustre client is patchless, which means that when building the Lustre code for a client, we do not need to patch the Linux vendor or vanilla kernel. All of the regression testing was performed on patchless Lustre clients, so we suggest using the vendor kernel.&lt;/p&gt;</comment>
                            <comment id="238177" author="pjones" created="Fri, 7 Dec 2018 17:59:53 +0000"  >&lt;p&gt;Campbell&lt;/p&gt;

&lt;p&gt;Even the servers only need to be patched if you are using the project quotas feature. The patches that gave performance improvements in past versions have now been upstreamed and many customers prefer the simplified admin over project quotas...&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="243009" author="cmcl" created="Thu, 28 Feb 2019 10:44:32 +0000"  >&lt;p&gt;Just some feedback: got some soft lockups on one of our clients, though it only happened once. The other clients have been fine.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                            <outwardlinks description="duplicates">
                                        <issuelink>
            <issuekey id="53341">LU-11391</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="44868">LU-9230</issuekey>
        </issuelink>
                            </outwardlinks>
                                                        </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="31577" name="build.log" size="38396" author="cmcl" created="Wed, 5 Dec 2018 18:40:26 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|i006sf:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>