<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 02:40:50 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-11089] Performance improvements for lu_object locking</title>
                <link>https://jira.whamcloud.com/browse/LU-11089</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;While porting the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6800&quot; title=&quot;Significant performance regression with patch LU-5264&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6800&quot;&gt;&lt;del&gt;LU-6800&lt;/del&gt;&lt;/a&gt; work upstream, the approach was disliked since it wasn&apos;t a real improvement. Neil has created a patch series to break up the global lock to increase its performance.&lt;/p&gt;</description>
                <environment></environment>
        <key id="52559">LU-11089</key>
            <summary>Performance improvements for lu_object locking</summary>
                <type id="4" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11310&amp;avatarType=issuetype">Improvement</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="simmonsja">James A Simmons</assignee>
                                    <reporter username="simmonsja">James A Simmons</reporter>
                        <labels>
                    </labels>
                <created>Wed, 13 Jun 2018 17:02:30 +0000</created>
                <updated>Tue, 11 Aug 2020 14:14:14 +0000</updated>
                            <resolved>Thu, 18 Jul 2019 19:09:08 +0000</resolved>
                                    <version>Lustre 2.12.0</version>
                                    <fixVersion>Lustre 2.13.0</fixVersion>
                    <fixVersion>Lustre 2.12.5</fixVersion>
                                        <due></due>
                            <votes>1</votes>
                                    <watches>12</watches>
                                                                            <comments>
                            <comment id="229519" author="gerrit" created="Wed, 13 Jun 2018 19:50:35 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/32711&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32711&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: make key_set_version an atomic_t&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 2da1e82923e31c017592353a79e52c8ddad9348f&lt;/p&gt;</comment>
                            <comment id="229520" author="gerrit" created="Wed, 13 Jun 2018 20:17:45 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/32712&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32712&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: use an rwsem instead of lu_key_initing_cnt.&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 8d698149c0170224e4fdb0cc4b13a5e7190f742a&lt;/p&gt;</comment>
                            <comment id="229521" author="gerrit" created="Wed, 13 Jun 2018 20:20:00 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/32713&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32713&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: remove locking from lu_context_exit()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 872ea28d4961209f74b827805a749a33407bb9b7&lt;/p&gt;</comment>
                            <comment id="231902" author="simmonsja" created="Tue, 14 Aug 2018 02:10:31 +0000"  >&lt;p&gt;Here are some performance numbers with the 3 patches posted so far for this work. Two more patches are needed to complete this work.&lt;/p&gt;

&lt;p&gt;Without patches:&lt;/p&gt;

&lt;p&gt;mdtest-1.9.4-rc was launched with 5 total task(s) on 5 node(s)&lt;/p&gt;

&lt;p&gt;Command line used: /lustre/crius/jsimmons/x86_64/mdtest -n 1000 -i 5 -z 2 -d /lustre/crius/jsimmons/performance_md_test&lt;/p&gt;

&lt;p&gt;Path: /lustre/crius/jsimmons&lt;/p&gt;

&lt;p&gt;FS: 100.2 TiB &#160; Used FS: 0.0% &#160; Inodes: 8.0 Mi &#160; Used Inodes: 0.0%&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;5 tasks, 4995 files/directories&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;SUMMARY: (of 5 iterations)&lt;/p&gt;

&lt;p&gt;&#160;&#160; Operation&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; Max&#160; &#160; &#160; &#160; &#160; &#160; Min &#160; &#160; &#160; &#160; &#160; Mean&#160; &#160; &#160; &#160; Std Dev&lt;/p&gt;

&lt;p&gt;&#160;&#160; ---------&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; ---&#160; &#160; &#160; &#160; &#160; &#160; --- &#160; &#160; &#160; &#160; &#160; ----&#160; &#160; &#160; &#160; -------&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory creation:&#160; &#160; &#160; 15427.405&#160; &#160; &#160; 12699.715&#160; &#160; &#160; 14055.058&#160; &#160; &#160; &#160; 990.423&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory stat&#160; &#160; :&#160; &#160; &#160; 25565.025&#160; &#160; &#160; 21514.805&#160; &#160; &#160; 24128.395 &#160; &#160; &#160; 1750.604&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory removal :&#160; &#160; &#160; 16948.667&#160; &#160; &#160; 13410.061&#160; &#160; &#160; 15774.485 &#160; &#160; &#160; 1439.361&lt;/p&gt;

&lt;p&gt;&#160;&#160; File creation &#160; &#160; : &#160; &#160; &#160; 5982.378 &#160; &#160; &#160; 4995.855 &#160; &#160; &#160; 5361.390&#160; &#160; &#160; &#160; 375.919&lt;/p&gt;

&lt;p&gt;&#160;&#160; File stat &#160; &#160; &#160; &#160; :&#160; &#160; &#160; 10494.583 &#160; &#160; &#160; 9369.004&#160; &#160; &#160; 10041.334&#160; &#160; &#160; &#160; 408.314&lt;/p&gt;

&lt;p&gt;&#160;&#160; File read &#160; &#160; &#160; &#160; : &#160; &#160; &#160; 7705.990 &#160; &#160; &#160; 6695.037 &#160; &#160; &#160; 7290.709&#160; &#160; &#160; &#160; 434.290&lt;/p&gt;

&lt;p&gt;&#160;&#160; File removal&#160; &#160; &#160; : &#160; &#160; &#160; 8118.476 &#160; &#160; &#160; 7387.675 &#160; &#160; &#160; 7833.091&#160; &#160; &#160; &#160; 262.636&lt;/p&gt;

&lt;p&gt;&#160;&#160; Tree creation &#160; &#160; : &#160; &#160; &#160; 2031.828 &#160; &#160; &#160; 1576.483 &#160; &#160; &#160; 1891.981&#160; &#160; &#160; &#160; 163.704&lt;/p&gt;

&lt;p&gt;&#160;&#160; Tree removal&#160; &#160; &#160; : &#160; &#160; &#160; 1221.602&#160; &#160; &#160; &#160; 952.344 &#160; &#160; &#160; 1119.629 &#160; &#160; &#160; &#160; 94.340&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&amp;#8211; finished at 08/13/2018 19:14:55 &amp;#8211;&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;*******************************************************************************************&lt;/p&gt;

&lt;p&gt;With the 3 patches:&lt;/p&gt;

&lt;p&gt;mdtest-1.9.4-rc was launched with 5 total task(s) on 5 node(s)&lt;/p&gt;

&lt;p&gt;Command line used: /lustre/crius/x86_64/mdtest -n 1000 -i 5 -z 2 -d /lustre/crius/performance_md_test&lt;/p&gt;

&lt;p&gt;Path: /lustre/crius&lt;/p&gt;

&lt;p&gt;FS: 100.2 TiB &#160; Used FS: 0.0% &#160; Inodes: 8.0 Mi &#160; Used Inodes: 0.0%&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;5 tasks, 4995 files/directories&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;SUMMARY: (of 5 iterations)&lt;/p&gt;

&lt;p&gt;&#160;&#160; Operation&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; Max&#160; &#160; &#160; &#160; &#160; &#160; Min &#160; &#160; &#160; &#160; &#160; Mean&#160; &#160; &#160; &#160; Std Dev&lt;/p&gt;

&lt;p&gt;&#160;&#160; ---------&#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; &#160; ---&#160; &#160; &#160; &#160; &#160; &#160; --- &#160; &#160; &#160; &#160; &#160; ----&#160; &#160; &#160; &#160; -------&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory creation:&#160; &#160; &#160; 17621.888&#160; &#160; &#160; 13372.852&#160; &#160; &#160; 15968.954 &#160; &#160; &#160; 1441.216&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory stat&#160; &#160; :&#160; &#160; &#160; 29448.160&#160; &#160; &#160; 24189.123&#160; &#160; &#160; 27233.240 &#160; &#160; &#160; 1811.668&lt;/p&gt;

&lt;p&gt;&#160;&#160; Directory removal :&#160; &#160; &#160; 20349.080&#160; &#160; &#160; 16581.538&#160; &#160; &#160; 18883.208 &#160; &#160; &#160; 1315.397&lt;/p&gt;

&lt;p&gt;&#160;&#160; File creation &#160; &#160; : &#160; &#160; &#160; 6240.638 &#160; &#160; &#160; 5677.361 &#160; &#160; &#160; 5930.478&#160; &#160; &#160; &#160; 201.596&lt;/p&gt;

&lt;p&gt;&#160;&#160; File stat &#160; &#160; &#160; &#160; :&#160; &#160; &#160; 10785.819&#160; &#160; &#160; 10541.888&#160; &#160; &#160; 10701.592 &#160; &#160; &#160; &#160; 85.094&lt;/p&gt;

&lt;p&gt;&#160;&#160; File read &#160; &#160; &#160; &#160; : &#160; &#160; &#160; 7550.051 &#160; &#160; &#160; 6797.333 &#160; &#160; &#160; 7383.661&#160; &#160; &#160; &#160; 293.526&lt;/p&gt;

&lt;p&gt;&#160;&#160; File removal&#160; &#160; &#160; : &#160; &#160; &#160; 9781.788 &#160; &#160; &#160; 8219.130 &#160; &#160; &#160; 8877.036&#160; &#160; &#160; &#160; 522.711&lt;/p&gt;

&lt;p&gt;&#160;&#160; Tree creation &#160; &#160; : &#160; &#160; &#160; 2150.501 &#160; &#160; &#160; 1322.451 &#160; &#160; &#160; 1820.234&#160; &#160; &#160; &#160; 279.086&lt;/p&gt;

&lt;p&gt;&#160;&#160; Tree removal&#160; &#160; &#160; : &#160; &#160; &#160; 1308.718&#160; &#160; &#160; &#160; 939.562 &#160; &#160; &#160; 1115.832&#160; &#160; &#160; &#160; 151.934&lt;/p&gt;

&lt;p&gt;&#160;&lt;/p&gt;

&lt;p&gt;&amp;#8211; finished at 08/13/2018 20:10:34 &amp;#8211;&lt;/p&gt;</comment>
                            <comment id="234554" author="sihara" created="Mon, 8 Oct 2018 06:08:27 +0000"  >&lt;p&gt;I&apos;m getting the following crash on servers (both OSS and MDS). I&apos;m still not sure this crash comes from the patch for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt;, but at least I started getting the crash after applying the patch, so it might be related... &lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[74844.146432] BUG: unable to handle kernel NULL pointer dereference at 0000000000000010
[74844.157577] IP: [&amp;lt;ffffffffc0b75aed&amp;gt;] nid_hash+0x2d/0x50 [obdclass]
[74844.167059] PGD 0 
[74844.172253] Oops: 0000 [#1] SMP 
[74844.178646] Modules linked in: osp(OE) mdd(OE) lod(OE) mdt(OE) lfsck(OE) mgc(OE) osd_ldiskfs(OE) lquota(OE) ldiskfs(OE) ksocklnd(OE) lustre(OE) lmv(OE) mdc(OE) osc(OE) lov(OE) fid(OE) fld(OE) ko2iblnd(OE) ptlrpc(OE) obdclass(OE) lnet(OE) libcfs(OE) rpcsec_gss_krb5 nfsv4 dns_resolver nfs fscache dell_rbu ib_srp(OE) scsi_transport_srp(OE) rdma_ucm(OE) ib_ucm(OE) rdma_cm(OE) iw_cm(OE) ib_ipoib(OE) ib_cm(OE) ib_uverbs(OE) ib_umad(OE) mlx5_fpga_tools(OE) mlx5_ib(OE) mlx5_core(OE) mlxfw(OE) mlx4_en(OE) skx_edac edac_core intel_powerclamp coretemp intel_rapl iosf_mbi kvm_intel kvm irqbypass dm_round_robin crc32_pclmul ghash_clmulni_intel dm_service_time aesni_intel lrw gf128mul glue_helper ablk_helper cryptd joydev iTCO_wdt iTCO_vendor_support pcspkr ipmi_si mei_me mei nfit lpc_ich ipmi_devintf acpi_power_meter
[74844.270643]  i2c_i801 acpi_cpufreq acpi_pad libnvdimm shpchp ipmi_msghandler wmi nfsd auth_rpcgss nfs_acl lockd knem(OE) dm_multipath grace sunrpc ip_tables ext4 mbcache jbd2 mlx4_ib(OE) ib_core(OE) sd_mod crc_t10dif crct10dif_generic ast i2c_algo_bit drm_kms_helper qla2xxx syscopyarea sysfillrect sysimgblt fb_sys_fops ttm crct10dif_pclmul crct10dif_common crc32c_intel ahci i40e drm libahci libata mlx4_core(OE) devlink scsi_transport_fc ptp mlx_compat(OE) pps_core i2c_core scsi_tgt dm_mirror dm_region_hash dm_log dm_mod sg [last unloaded: libcfs]
[74844.334968] CPU: 34 PID: 321939 Comm: mdt05_002 Tainted: G           OE  ------------   3.10.0-693.21.1.el7_lustre.ddn1.x86_64 #1
[74844.352809] Hardware name: Supermicro SYS-5019P-WT/X11SPW-TF, BIOS 1.0 06/06/2017
[74844.363379] task: ffff88173113af70 ti: ffff88176cef0000 task.ti: ffff88176cef0000
[74844.373918] RIP: 0010:[&amp;lt;ffffffffc0b75aed&amp;gt;]  [&amp;lt;ffffffffc0b75aed&amp;gt;] nid_hash+0x2d/0x50 [obdclass]
[74844.385637] RSP: 0018:ffff88176cef3b40  EFLAGS: 00010206
[74844.393941] RAX: 000000000002b5a5 RBX: ffff8801d5ae1080 RCX: 0000000000000001
[74844.404043] RDX: 000000000000007f RSI: 0000000000000010 RDI: 000000000002a0a0
[74844.414099] RBP: ffff88176cef3b68 R08: 0000000000000000 R09: ffffffffc0dc02d1
[74844.424113] R10: ffff8817da29b960 R11: ffff8817277c9400 R12: 0000000000000007
[74844.434089] R13: ffff88176cef3b88 R14: ffff8817d138fa40 R15: ffff8801deae1038
[74844.444021] FS:  0000000000000000(0000) GS:ffff8817da280000(0000) knlGS:0000000000000000
[74844.454889] CS:  0010 DS: 0000 ES: 0000 CR0: 0000000080050033
[74844.463390] CR2: 0000000000000010 CR3: 0000000001a02000 CR4: 00000000003607e0
[74844.473242] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[74844.483049] DR3: 0000000000000000 DR6: 00000000fffe0ff0 DR7: 0000000000000400
[74844.492804] Call Trace:
[74844.497826]  [&amp;lt;ffffffffc0913388&amp;gt;] ? cfs_hash_bd_from_key+0x38/0xb0 [libcfs]
[74844.507416]  [&amp;lt;ffffffffc0913425&amp;gt;] cfs_hash_bd_get+0x25/0x70 [libcfs]
[74844.516384]  [&amp;lt;ffffffffc09166d2&amp;gt;] cfs_hash_add+0x52/0x1a0 [libcfs]
[74844.525211]  [&amp;lt;ffffffffc0d8a765&amp;gt;] target_handle_connect+0x1fe5/0x29b0 [ptlrpc]
[74844.535080]  [&amp;lt;ffffffffc0e2e93a&amp;gt;] tgt_request_handle+0x50a/0x1580 [ptlrpc]
[74844.544540]  [&amp;lt;ffffffffc0e0aa41&amp;gt;] ? ptlrpc_nrs_req_get_nolock0+0xd1/0x170 [ptlrpc]
[74844.554587]  [&amp;lt;ffffffff810ee42f&amp;gt;] ? __getnstimeofday64+0x3f/0xd0
[74844.563088]  [&amp;lt;ffffffffc0dd5b6b&amp;gt;] ptlrpc_server_handle_request+0x24b/0xab0 [ptlrpc]
[74844.573214]  [&amp;lt;ffffffffc0dd29f5&amp;gt;] ? ptlrpc_wait_event+0xa5/0x360 [ptlrpc]
[74844.582360]  [&amp;lt;ffffffff810c7c82&amp;gt;] ? default_wake_function+0x12/0x20
[74844.590949]  [&amp;lt;ffffffff810bdc4b&amp;gt;] ? __wake_up_common+0x5b/0x90
[74844.599113]  [&amp;lt;ffffffffc0dd9384&amp;gt;] ptlrpc_main+0xaf4/0x1fa0 [ptlrpc]
[74844.607705]  [&amp;lt;ffffffffc0dd8890&amp;gt;] ? ptlrpc_register_service+0xe90/0xe90 [ptlrpc]
[74844.617338]  [&amp;lt;ffffffff810b4031&amp;gt;] kthread+0xd1/0xe0
[74844.624400]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[74844.632668]  [&amp;lt;ffffffff816c0577&amp;gt;] ret_from_fork+0x77/0xb0
[74844.640212]  [&amp;lt;ffffffff810b3f60&amp;gt;] ? insert_kthread_work+0x40/0x40
[74844.648439] Code: 44 00 00 48 85 f6 74 37 b9 01 00 00 00 45 31 c0 b8 05 15 00 00 eb 0d 0f 1f 80 00 00 00 00 49 89 c8 48 89 f9 89 c7 c1 e7 05 01 f8 &amp;lt;42&amp;gt; 0f be 3c 06 01 f8 48 8d 79 01 48 83 ff 09 75 e2 21 d0 c3 55 
[74844.673703] RIP  [&amp;lt;ffffffffc0b75aed&amp;gt;] nid_hash+0x2d/0x50 [obdclass]
[74844.682236]  RSP &amp;lt;ffff88176cef3b40&amp;gt;
[74844.687869] CR2: 0000000000000010
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;
&lt;p&gt;&#160;&lt;/p&gt;</comment>
                            <comment id="234573" author="simmonsja" created="Mon, 8 Oct 2018 16:32:44 +0000"  >&lt;p&gt;What triggers this crash? Is it one of the Maloo tests, or does running a particular application cause this? Also, are you using all the posted LU-11089 patches?&lt;/p&gt;</comment>
                            <comment id="234939" author="ruth.klundt@gmail.com" created="Mon, 15 Oct 2018 19:04:46 +0000"  >&lt;p&gt;hi james,&lt;/p&gt;

&lt;p&gt;I&apos;ve seen that too, just once on an OSS. I had done an abort_recovery on the mdt, and was mounting ~130 2.8 clients. got impatient I guess.&lt;/p&gt;

&lt;p&gt;Servers x86 built at commit 4e42995.&lt;/p&gt;</comment>
                            <comment id="234942" author="simmonsja" created="Mon, 15 Oct 2018 20:29:23 +0000"  >&lt;p&gt;Thanks Ruth for the info. Is this with these patches applied or did it happen independently? Hmmm. I suspect&#160; a bug is buried in the NID hash code. Anyways I was planning to port it to rhashtable handling since that scales better and rhashtable is a standard in the linux kernel. Ruth can you reproduce it every time or was this a once off?&lt;/p&gt;</comment>
                            <comment id="234943" author="ruth.klundt@gmail.com" created="Mon, 15 Oct 2018 20:32:21 +0000"  >&lt;p&gt;One off with no patches applied.&lt;/p&gt;

&lt;p&gt;After I brought the node back all the clients mounted and tests ran.&lt;/p&gt;</comment>
                            <comment id="234953" author="sihara" created="Mon, 15 Oct 2018 22:30:50 +0000"  >&lt;p&gt;This happens quite often. I saw a crash even at initial mount, e.g. create a filesystem and mount Lustre on 32 clients, then one of the OSSes crashed.&lt;/p&gt;</comment>
                            <comment id="235365" author="simmonsja" created="Tue, 23 Oct 2018 15:45:10 +0000"  >&lt;p&gt;Thanks for the info. Ruth has pointed out that this is a general bug. I have started the port of the nid hash to rhashtable and I&apos;m seeing hidden issues with the original code.&lt;/p&gt;</comment>
                            <comment id="235946" author="simmonsja" created="Tue, 30 Oct 2018 20:15:55 +0000"  >&lt;p&gt;Since the NID hash seems to be broken in general I did a port to rhashtables. I still need to work on the /proc entries to display hash stats. Please try it out to see if it no longer crashes your nodes. Patch is at:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;https://review.whamcloud.com/#/c/33518&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/#/c/33518&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;The build breakage is only on SLES12SP3.&lt;/p&gt;</comment>
                            <comment id="236080" author="paf" created="Wed, 31 Oct 2018 21:08:17 +0000"  >&lt;p&gt;Seen here during recovery as well.&#160; Interesting.&#160; I imagine even if the bug was already there, the changes made it easier to hit.&#160; (Doesn&apos;t mean the changes are wrong, just that there&apos;s probably a reason we&apos;re suddenly seeing it.)&lt;/p&gt;</comment>
                            <comment id="236150" author="paf" created="Thu, 1 Nov 2018 15:42:00 +0000"  >&lt;p&gt;Ah, I see now that none of the patches have landed.&#160; So it is definitely a pre-existing bug.&#160; Interesting.&lt;/p&gt;</comment>
                            <comment id="236236" author="pjones" created="Fri, 2 Nov 2018 14:01:07 +0000"  >&lt;p&gt;Could we please have a separate ticket for any instances seen on 2.12 or earlier releases without James&apos;s unlanded patches being applied? Is there any suggestion that this is happening more frequently on 2.12 compared to 2.11 and earlier releases?&lt;/p&gt;</comment>
                            <comment id="236365" author="sihara" created="Tue, 6 Nov 2018 00:47:24 +0000"  >&lt;p&gt;James, the crashing servers were not related to your patches (&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt;), but it looks like a more general problem in master. Let me open a new Jira ticket for this.&lt;/p&gt;</comment>
                            <comment id="236366" author="simmonsja" created="Tue, 6 Nov 2018 00:50:28 +0000"  >&lt;p&gt;Thanks. I have a patch based on &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-8130&quot; title=&quot;Migrate from libcfs hash to rhashtable&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-8130&quot;&gt;LU-8130&lt;/a&gt; work that should fix this.&lt;/p&gt;</comment>
                            <comment id="236441" author="paf" created="Tue, 6 Nov 2018 16:21:19 +0000"  >&lt;p&gt;Ihara,&lt;/p&gt;

&lt;p&gt;Could you link that ticket here?&#160; I&apos;m interested in tracking it.&#160; Our MDSses running 2.12 are crashing when we fail them over under load.&#160; Pretty reliably. &lt;img class=&quot;emoticon&quot; src=&quot;https://jira.whamcloud.com/images/icons/emoticons/sad.png&quot; height=&quot;16&quot; width=&quot;16&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/p&gt;</comment>
                            <comment id="236442" author="sihara" created="Tue, 6 Nov 2018 16:32:47 +0000"  >&lt;p&gt;Patrick, sorry! I forgot to update this ticket. Here is the new ticket: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11624&quot; title=&quot; BUG: unable to handle kernel NULL pointer at nid_hash()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11624&quot;&gt;&lt;del&gt;LU-11624&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</comment>
                            <comment id="237052" author="gerrit" created="Thu, 15 Nov 2018 19:27:28 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/33667&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33667&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: use wait_event_var() in lu_context_key_degister()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 37bb534e3779c4cfcf46a0206583ce3a88be69d1&lt;/p&gt;</comment>
                            <comment id="237053" author="gerrit" created="Thu, 15 Nov 2018 19:32:11 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/33668&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33668&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: remove lock from key register/degister&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 837c5d44d10daf04353e900939d9977feed064c5&lt;/p&gt;</comment>
                            <comment id="237098" author="gerrit" created="Fri, 16 Nov 2018 16:37:40 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/33673&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33673&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: rename lu_keys_guard to lu_context_remembered_guard&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 0c790df73f57138e554326d95566de04618c1e93&lt;/p&gt;</comment>
                            <comment id="237099" author="gerrit" created="Fri, 16 Nov 2018 16:39:45 +0000"  >&lt;p&gt;James Simmons (uja.ornl@yahoo.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/33674&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33674&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; lu_object: fix possible hang waiting for LCS_LEAVING&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 28bd00dbcada616bcb5cf14899c3feac784bc6c1&lt;/p&gt;</comment>
                            <comment id="237110" author="simmonsja" created="Fri, 16 Nov 2018 19:33:12 +0000"  >&lt;p&gt;Sigh, RHEL 7.6 did a port wrong from upstream &lt;img class=&quot;emoticon&quot; src=&quot;https://jira.whamcloud.com/images/icons/emoticons/sad.png&quot; height=&quot;16&quot; width=&quot;16&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&#160;Need to download RHEL kernel source and see how they botched the port.&lt;/p&gt;</comment>
                            <comment id="242880" author="gerrit" created="Wed, 27 Feb 2019 02:00:50 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/32711/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32711/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: make key_set_version an atomic_t&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: e9213217691ae78d15237b0c5ecd3ba0b0416652&lt;/p&gt;</comment>
                            <comment id="242881" author="gerrit" created="Wed, 27 Feb 2019 02:01:00 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/32712/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32712/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: use an rwsem instead of lu_key_initing_cnt.&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 99bb9f91f5c5ca6a380b22efa04a3c00c8f520ca&lt;/p&gt;</comment>
                            <comment id="247415" author="gerrit" created="Tue, 21 May 2019 05:10:54 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/32713/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/32713/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obdclass: remove locking from lu_context_exit()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 62f6496f81ff5896ecc778c9e57b6f84d0f83da9&lt;/p&gt;</comment>
                            <comment id="248172" author="gerrit" created="Sat, 1 Jun 2019 03:55:50 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/33667/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33667/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: use wait_event_var() in lu_context_key_degister()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: 372ef85512dd2a722415fba9a3df66f81029508b&lt;/p&gt;</comment>
                            <comment id="248173" author="gerrit" created="Sat, 1 Jun 2019 03:57:56 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/33668/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33668/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: remove lock from key register/degister&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: f0b78533f07ca6d766f1ea97a623cdd6ff063e0f&lt;/p&gt;</comment>
                            <comment id="249528" author="gerrit" created="Thu, 20 Jun 2019 03:51:19 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/33673/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/33673/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: rename lu_keys_guard to lu_context_remembered_guard&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: bf86b80e4eacd0734665aa818d9cdebf0c157ee1&lt;/p&gt;</comment>
                            <comment id="249532" author="simmonsja" created="Thu, 20 Jun 2019 03:53:05 +0000"  >&lt;p&gt;Last patch landed.&lt;/p&gt;</comment>
                            <comment id="269896" author="gerrit" created="Tue, 12 May 2020 00:59:45 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38570&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38570&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: use wait_event_var() in lu_context_key_degister()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 5df1c23bd60c193ae8e396840d58c7d7e532568e&lt;/p&gt;</comment>
                            <comment id="269906" author="gerrit" created="Tue, 12 May 2020 05:16:43 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) uploaded a new patch: &lt;a href=&quot;https://review.whamcloud.com/38573&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38573&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: use wait_event_var() in lu_context_key_degister()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: a69b6a8f4f1de86ce247620315877a8050e102f8&lt;/p&gt;</comment>
                            <comment id="270812" author="gerrit" created="Thu, 21 May 2020 06:08:01 +0000"  >&lt;p&gt;Oleg Drokin (green@whamcloud.com) merged in patch &lt;a href=&quot;https://review.whamcloud.com/38573/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://review.whamcloud.com/38573/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-11089&quot; title=&quot;Performance improvements for lu_object locking&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-11089&quot;&gt;&lt;del&gt;LU-11089&lt;/del&gt;&lt;/a&gt; obd: use wait_event_var() in lu_context_key_degister()&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: b2_12&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: ceb45b5fbe35a65539b76678d8187a902504b138&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="30925">LU-6800</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="46758">LU-9679</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="37888">LU-8346</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="56445">LU-12565</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzzyc7:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>9223372036854775807</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                                                                                </customfields>
    </item>
</channel>
</rss>