<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:43:16 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-4499] NRS ORR cfs_hash_find_or_add() LBUG</title>
                <link>https://jira.whamcloud.com/browse/LU-4499</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Hit LBUG and crash on OSS during IOR SSF(Single shared file) test with striping setting on all OSTs(lfs setstripe -c -1).&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;&amp;lt;0&amp;gt;LustreError: 28757:0:(hash.c:1252:cfs_hash_find_or_add()) ASSERTION( hlist_unhashed(hnode) ) failed: 
&amp;lt;0&amp;gt;LustreError: 28757:0:(hash.c:1252:cfs_hash_find_or_add()) LBUG
&amp;lt;0&amp;gt;Kernel panic - not syncing: LBUG in interrupt.
&amp;lt;0&amp;gt;
&amp;lt;4&amp;gt;Pid: 28757, comm: ll_ost01_008 Not tainted 2.6.32-358.23.2.el6_lustre.ge975b1c.x86_64 #1
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8150deec&amp;gt;] ? panic+0xa7/0x16f
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa065aedd&amp;gt;] ? lbug_with_loc+0x8d/0xb0 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0672d80&amp;gt;] ? cfs_hash_findadd_unique+0x0/0x30 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0672d98&amp;gt;] ? cfs_hash_findadd_unique+0x18/0x30 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c83c76&amp;gt;] ? nrs_orr_res_get+0x696/0xb90 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81055ad3&amp;gt;] ? __wake_up+0x53/0x70
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c79e36&amp;gt;] ? nrs_resource_get+0x56/0x110 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c37d95&amp;gt;] ? lustre_msg_buf+0x55/0x60 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c7a7fb&amp;gt;] ? nrs_resource_get_safe+0x8b/0x100 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c7ce38&amp;gt;] ? ptlrpc_nrs_req_hp_move+0x68/0x210 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c5f845&amp;gt;] ? req_capsule_client_get+0x15/0x20 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c1a158&amp;gt;] ? ldlm_server_blocking_ast+0x228/0x880 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c8f65b&amp;gt;] ? tgt_blocking_ast+0x7b/0x5e0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0beb1ba&amp;gt;] ? ldlm_add_bl_work_item+0x8a/0x1e0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0bee405&amp;gt;] ? ldlm_add_ast_work_item+0x55/0x180 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0bed38d&amp;gt;] ? ldlm_work_bl_ast_lock+0xdd/0x290 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c2e3bc&amp;gt;] ? ptlrpc_set_wait+0x6c/0x860 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff811685ac&amp;gt;] ? __kmalloc+0x20c/0x220
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c2b06a&amp;gt;] ? ptlrpc_prep_set+0xfa/0x2f0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0bed2b0&amp;gt;] ? ldlm_work_bl_ast_lock+0x0/0x290 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0bf006b&amp;gt;] ? ldlm_run_ast_work+0x1bb/0x470 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c070ad&amp;gt;] ? ldlm_process_extent_lock+0x13d/0xa90 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0bef5ab&amp;gt;] ? ldlm_lock_enqueue+0x3fb/0x920 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c18c4f&amp;gt;] ? ldlm_handle_enqueue0+0x4ef/0x10a0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c92562&amp;gt;] ? tgt_enqueue+0x62/0x1d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c94f5a&amp;gt;] ? tgt_handle_request0+0x2ea/0x1490 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa065b4ce&amp;gt;] ? cfs_timer_arm+0xe/0x10 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa066c3af&amp;gt;] ? lc_watchdog_touch+0x6f/0x170 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c3792c&amp;gt;] ? lustre_msg_get_opc+0x9c/0x110 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c9653a&amp;gt;] ? tgt_request_handle+0x43a/0x980 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c4a295&amp;gt;] ? ptlrpc_main+0xd25/0x1970 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810096f0&amp;gt;] ? __switch_to+0xd0/0x320
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8150e600&amp;gt;] ? thread_return+0x4e/0x76e
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0c49570&amp;gt;] ? ptlrpc_main+0x0/0x1970 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81096a36&amp;gt;] ? kthread+0x96/0xa0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0ca&amp;gt;] ? child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffff810969a0&amp;gt;] ? kthread+0x0/0xa0
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>Lustre-2.5.52 (server), Lustre-2.5.53(Client)</environment>
        <key id="22764">LU-4499</key>
            <summary>NRS ORR cfs_hash_find_or_add() LBUG</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="ihara">Shuichi Ihara</reporter>
                        <labels>
                            <label>cea</label>
                    </labels>
                <created>Thu, 16 Jan 2014 16:32:59 +0000</created>
                <updated>Tue, 19 Mar 2019 15:45:28 +0000</updated>
                            <resolved>Wed, 26 Aug 2015 17:40:05 +0000</resolved>
                                    <version>Lustre 2.5.0</version>
                    <version>Lustre 2.6.0</version>
                    <version>Lustre 2.8.0</version>
                                    <fixVersion>Lustre 2.8.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>21</watches>
                                                                            <comments>
                            <comment id="75091" author="ihara" created="Thu, 16 Jan 2014 16:34:51 +0000"  >&lt;p&gt;ORR(Object-Based Round Robin) is turned on as NRS policy in this testing.&lt;/p&gt;</comment>
                            <comment id="75208" author="pjones" created="Fri, 17 Jan 2014 19:14:14 +0000"  >&lt;p&gt;Lai&lt;/p&gt;

&lt;p&gt;could you please help with this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="75843" author="laisiyao" created="Wed, 29 Jan 2014 12:20:58 +0000"  >&lt;p&gt;This doesn&apos;t look likely to happen, because though orro-&amp;gt;oo_hnode is not initialised before use, it&apos;s zeroed at allocation time by default. Anyway I composed a patch to initialise it, could you patch it and test on your system?&lt;/p&gt;

&lt;p&gt;Patch is on &lt;a href=&quot;http://review.whamcloud.com/#/c/9046/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9046/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="80943" author="ihara" created="Thu, 3 Apr 2014 15:23:24 +0000"  >&lt;p&gt;patch &lt;a href=&quot;http://review.whamcloud.com/#/c/9046/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9046/&lt;/a&gt; doesn&apos;t help. We hit another crash here. &lt;br/&gt;
Just change NRS policy to ORR(lctl set_param ost.OSS.ost_io.nrs_policies=orr), run IOR from client, then hit crash on OSS.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;&amp;lt;4&amp;gt;------------[ cut here ]------------
&amp;lt;2&amp;gt;kernel BUG at mm/slab.c:2835!
&amp;lt;4&amp;gt;invalid opcode: 0000 [#1] SMP 
&amp;lt;4&amp;gt;last sysfs file: /sys/devices/pci0000:00/0000:00:03.0/0000:05:00.0/host7/target7:0:0/7:0:0:2/state
&amp;lt;4&amp;gt;CPU 3 
&amp;lt;4&amp;gt;Modules linked in: osp(U) ofd(U) ost(U) mgc(U) fsfilt_ldiskfs(U) osd_ldiskfs(U) ldiskfs(U) lquota(U) jbd2 mdd(U) fid(U) fld(U) ptlrpc(U) ko2iblnd(U) obdc
lass(U) lnet(U) lvfs(U) sha512_generic sha256_generic crc32c_intel libcfs(U) ib_srp(U) scsi_transport_srp(U) bridge stp llc ipmi_devintf dell_rbu nfs lockd 
fscache auth_rpcgss nfs_acl sunrpc rdma_ucm(U) ib_ucm(U) rdma_cm(U) iw_cm(U) ib_ipoib(U) ib_cm(U) ib_uverbs(U) ib_umad(U) mlx5_ib(U) mlx5_core(U) mlx4_en(U)
 mlx4_ib(U) ib_sa(U) ib_mad(U) ib_core(U) ib_addr(U) ipv6 mlx4_core(U) compat(U) dm_round_robin dm_multipath vhost_net macvtap macvlan tun kvm knem(U) power
_meter ses enclosure sg shpchp tg3 dcdbas microcode iTCO_wdt iTCO_vendor_support ext3 jbd mbcache sr_mod cdrom sd_mod crc_t10dif ahci wmi megaraid_sas dm_mi
rror dm_region_hash dm_log dm_mod [last unloaded: speedstep_lib]
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Pid: 1868, comm: ll_ost_io01_002 Not tainted 2.6.32-358.23.2.el6_lustre.x86_64 #1 Dell Inc. PowerEdge R620/01W23F
&amp;lt;4&amp;gt;RIP: 0010:[&amp;lt;ffffffff81167473&amp;gt;]  [&amp;lt;ffffffff81167473&amp;gt;] cache_grow+0x313/0x320
&amp;lt;4&amp;gt;RSP: 0018:ffff881fdf96fc10  EFLAGS: 00010002
&amp;lt;4&amp;gt;RAX: ffff883f50d87c80 RBX: ffff881f879c1b80 RCX: 0000000000000000
&amp;lt;4&amp;gt;RDX: 0000000000000001 RSI: 0000000000041212 RDI: ffff881f879c1b80
&amp;lt;4&amp;gt;RBP: ffff881fdf96fc70 R08: 0000000000000000 R09: 000000000000dee6
&amp;lt;4&amp;gt;R10: 0000000000000000 R11: 0000000000000000 R12: 0000000000041212
&amp;lt;4&amp;gt;R13: ffff883f50d87c40 R14: 0000000000000010 R15: 0000000000000000
&amp;lt;4&amp;gt;FS:  00007f7bccdf8700(0000) GS:ffff8820f0c20000(0000) knlGS:0000000000000000
&amp;lt;4&amp;gt;CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
&amp;lt;4&amp;gt;CR2: 0000000000481000 CR3: 00000040517c6000 CR4: 00000000001407e0
&amp;lt;4&amp;gt;DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
&amp;lt;4&amp;gt;DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
&amp;lt;4&amp;gt;Process ll_ost_io01_002 (pid: 1868, threadinfo ffff881fdf96e000, task ffff88203554e040)
&amp;lt;4&amp;gt;Stack:
&amp;lt;4&amp;gt; 00000000533d4823 0000000000000000 0000000000800000 0800000000000000
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; 0000000000000000 0000000000002000 000000000000127e ffff881f879c1b80
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; ffff883fd9162800 ffff883f50d87c40 0000000000000010 ffff883f50d87c60
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81167682&amp;gt;] cache_alloc_refill+0x202/0x240
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8116714e&amp;gt;] kmem_cache_alloc_node+0x1be/0x1d0
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa049e8a1&amp;gt;] cfs_mem_cache_cpt_alloc+0x41/0x50 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09ee769&amp;gt;] nrs_orr_res_get+0x5d9/0xba0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09e4b56&amp;gt;] nrs_resource_get+0x56/0x110 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09a5860&amp;gt;] ? lustre_swab_niobuf_remote+0x0/0x30 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09e551b&amp;gt;] nrs_resource_get_safe+0x8b/0x100 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09e7a48&amp;gt;] ptlrpc_nrs_req_initialize+0x38/0x90 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b4e00&amp;gt;] ptlrpc_main+0x1180/0x1700 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b3c80&amp;gt;] ? ptlrpc_main+0x0/0x1700 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b3c80&amp;gt;] ? ptlrpc_main+0x0/0x1700 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b3c80&amp;gt;] ? ptlrpc_main+0x0/0x1700 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&amp;lt;4&amp;gt;Code: 0f 1f 84 00 00 00 00 00 49 8d 54 24 30 48 c7 c0 fc ff ff ff 48 89 55 c8 e9 e1 fe ff ff 0f 0b eb fe ba 01 00 00 00 e9 2a fe ff ff &amp;lt;0f&amp;gt; 0b eb fe 66 0
f 1f 84 00 00 00 00 00 55 48 89 e5 41 57 41 56 
&amp;lt;1&amp;gt;RIP  [&amp;lt;ffffffff81167473&amp;gt;] cache_grow+0x313/0x320
&amp;lt;4&amp;gt; RSP &amp;lt;ffff881fdf96fc10&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="82045" author="laisiyao" created="Mon, 21 Apr 2014 13:51:03 +0000"  >&lt;p&gt;This time it LBUG in kernel mm/slab.c:2835&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;BUG_ON(flags &amp;amp; GFP_SLAB_BUG_MASK)
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;I don&apos;t see how it can happen yet, because it seems in entry of kmem_cache_alloc_node() has adjusted &quot;flags&quot; with &quot;gfp_allowed_mask&quot;, and the only possible flags lustre code will set is GFP_ATOMIC, GFP_NOFS and __GFP_ZERO which are all valid.&lt;/p&gt;

&lt;p&gt;I will do more test to find out the cause.&lt;/p&gt;</comment>
                            <comment id="102610" author="laisiyao" created="Tue, 6 Jan 2015 02:51:10 +0000"  >&lt;p&gt;This may be a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4362&quot; title=&quot;cfs_hash_rehash_key() passed wrong parameters to cfs_hash_keycpy&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4362&quot;&gt;&lt;del&gt;LU-4362&lt;/del&gt;&lt;/a&gt;, could you verify &lt;a href=&quot;http://review.whamcloud.com/#/c/8509/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/8509/&lt;/a&gt; is included in your branch? if not, you may apply it and test again.&lt;/p&gt;</comment>
                            <comment id="115034" author="jamesanunez" created="Tue, 12 May 2015 16:51:10 +0000"  >&lt;p&gt;In the latest version of master, I&apos;m seeing this LBUG in sanityn test 77c. Is this related to &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-6558&quot; title=&quot;replay-single: test_61c, test_90 timeout: nrs_orr_res_get() accessed NULL pointer&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-6558&quot;&gt;&lt;del&gt;LU-6558&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;

&lt;p&gt;Here are some recent test sessions that have failed with this LBUG:&lt;br/&gt;
review-zfs  - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/63ca7db8-f830-11e4-a933-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/63ca7db8-f830-11e4-a933-5254006e85c2&lt;/a&gt;&lt;br/&gt;
review-zfs - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/2d786c4c-f8b8-11e4-bb24-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/2d786c4c-f8b8-11e4-bb24-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="115205" author="jay" created="Wed, 13 May 2015 16:40:58 +0000"  >&lt;p&gt;hit again at: &lt;a href=&quot;https://testing.hpdd.intel.com/test_logs/05f59e66-f989-11e4-939f-5254006e85c2/show_text&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_logs/05f59e66-f989-11e4-939f-5254006e85c2/show_text&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;with the following backtrace:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;00:49:01:LustreError: 12123:0:(hash.c:1256:cfs_hash_find_or_add()) ASSERTION( hlist_unhashed(hnode) ) failed: 
00:49:01:LustreError: 12123:0:(hash.c:1256:cfs_hash_find_or_add()) LBUG
00:49:01:Kernel panic - not syncing: LBUG in interrupt.
00:49:01:
00:49:01:Pid: 12123, comm: ll_ost00_004 Tainted: P           ---------------    2.6.32-504.16.2.el6_lustre.gd805a88.x86_64 #1
00:49:01:Call Trace:
00:49:01: [&amp;lt;ffffffff81529fbc&amp;gt;] ? panic+0xa7/0x16f
00:49:01: [&amp;lt;ffffffffa0709ebd&amp;gt;] ? lbug_with_loc+0x8d/0xb0 [libcfs]
00:49:01: [&amp;lt;ffffffffa071df20&amp;gt;] ? cfs_hash_findadd_unique+0x0/0x30 [libcfs]
00:49:01: [&amp;lt;ffffffffa071df38&amp;gt;] ? cfs_hash_findadd_unique+0x18/0x30 [libcfs]
00:49:01: [&amp;lt;ffffffffa0aceb4b&amp;gt;] ? nrs_orr_res_get+0x43b/0xc30 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ac4fb6&amp;gt;] ? nrs_resource_get+0x56/0x110 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a83665&amp;gt;] ? lustre_msg_buf+0x55/0x60 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ac597b&amp;gt;] ? nrs_resource_get_safe+0x8b/0x100 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ac807b&amp;gt;] ? ptlrpc_nrs_req_hp_move+0x6b/0x210 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0aab445&amp;gt;] ? req_capsule_client_get+0x15/0x20 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a633f8&amp;gt;] ? ldlm_server_blocking_ast+0x228/0x8b0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ae1ba1&amp;gt;] ? tgt_blocking_ast+0x1b1/0x8b0 [ptlrpc]
00:49:01: [&amp;lt;ffffffff812975c4&amp;gt;] ? snprintf+0x34/0x40
00:49:01: [&amp;lt;ffffffffa0a36dbd&amp;gt;] ? ldlm_work_bl_ast_lock+0xdd/0x290 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a791c4&amp;gt;] ? ptlrpc_set_wait+0x74/0x900 [ptlrpc]
00:49:01: [&amp;lt;ffffffff81174c13&amp;gt;] ? kmem_cache_alloc_trace+0x1b3/0x1c0
00:49:01: [&amp;lt;ffffffff81174f6c&amp;gt;] ? __kmalloc+0x21c/0x230
00:49:01: [&amp;lt;ffffffffa0a758d2&amp;gt;] ? ptlrpc_prep_set+0x112/0x2e0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a36ce0&amp;gt;] ? ldlm_work_bl_ast_lock+0x0/0x290 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a38f7b&amp;gt;] ? ldlm_run_ast_work+0x1db/0x470 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a50685&amp;gt;] ? ldlm_process_extent_lock+0x155/0xab0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a3883b&amp;gt;] ? ldlm_lock_enqueue+0x46b/0x9d0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a6472b&amp;gt;] ? ldlm_handle_enqueue0+0x51b/0x13f0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ae56b1&amp;gt;] ? tgt_enqueue+0x61/0x230 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0ae61ce&amp;gt;] ? tgt_request_handle+0x94e/0x10a0 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a95bf1&amp;gt;] ? ptlrpc_main+0xe41/0x1970 [ptlrpc]
00:49:01: [&amp;lt;ffffffffa0a94db0&amp;gt;] ? ptlrpc_main+0x0/0x1970 [ptlrpc]
00:49:01: [&amp;lt;ffffffff8109e71e&amp;gt;] ? kthread+0x9e/0xc0
00:49:01: [&amp;lt;ffffffff8100c20a&amp;gt;] ? child_rip+0xa/0x20
00:49:01: [&amp;lt;ffffffff8109e680&amp;gt;] ? kthread+0x0/0xc0
00:49:01: [&amp;lt;ffffffff8100c200&amp;gt;] ? child_rip+0x0/0x20
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="115242" author="jay" created="Wed, 13 May 2015 18:58:51 +0000"  >&lt;p&gt;It seems like a memory corruption issue.&lt;/p&gt;</comment>
                            <comment id="116139" author="yujian" created="Thu, 21 May 2015 21:05:07 +0000"  >&lt;p&gt;More instances on master branch:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/d086aa90-fffa-11e4-a3db-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/d086aa90-fffa-11e4-a3db-5254006e85c2&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/2d9d9918-ff2f-11e4-be81-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/2d9d9918-ff2f-11e4-be81-5254006e85c2&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/2d9d9918-ff2f-11e4-be81-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/2d9d9918-ff2f-11e4-be81-5254006e85c2&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/b8f327a0-fec9-11e4-a4ed-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/b8f327a0-fec9-11e4-a4ed-5254006e85c2&lt;/a&gt;&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/d505ade0-fe8e-11e4-919c-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/d505ade0-fe8e-11e4-919c-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="116252" author="bogl" created="Fri, 22 May 2015 21:20:31 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3916eec4-00c5-11e5-9650-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3916eec4-00c5-11e5-9650-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="116429" author="adilger" created="Tue, 26 May 2015 17:46:57 +0000"  >&lt;p&gt;This is failing about twice a day on average.  It has been hitting regularly since 2015-05-04, so maybe some patch that landed within the previous day or two caused this problem to fail more often?&lt;/p&gt;

&lt;p&gt;In hindsight, that is because the NRS testing was enabled via &lt;a href=&quot;http://review.whamcloud.com/9286&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/9286&lt;/a&gt; &quot;&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3266&quot; title=&quot;Regression tests for NRS policies&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3266&quot;&gt;&lt;del&gt;LU-3266&lt;/del&gt;&lt;/a&gt; test: regression tests for nrs policies&quot; on 2015-05-01, so the bug itself has probably been around a long time.&lt;/p&gt;</comment>
                            <comment id="117447" author="sebastien.buisson" created="Thu, 4 Jun 2015 15:52:16 +0000"  >&lt;p&gt;Hi,&lt;/p&gt;

&lt;p&gt;One more instance:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/320f7778-09c5-11e5-8421-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/320f7778-09c5-11e5-8421-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="119159" author="bogl" created="Fri, 19 Jun 2015 22:51:54 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/92cbbd1a-16d1-11e5-8436-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/92cbbd1a-16d1-11e5-8436-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="119922" author="jamesanunez" created="Tue, 30 Jun 2015 14:15:23 +0000"  >&lt;p&gt;Several recent failures on master:&lt;br/&gt;
2015-06-25 04:16:38 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3777cfde-1b55-11e5-ac09-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3777cfde-1b55-11e5-ac09-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-06-25 10:17:54 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/a76ea20e-1b9b-11e5-ac09-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/a76ea20e-1b9b-11e5-ac09-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-06-26 15:02:25 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/474e2b02-1c76-11e5-9e33-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/474e2b02-1c76-11e5-9e33-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-06-27 09:20:38  - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/a148e48a-1d16-11e5-9df2-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/a148e48a-1d16-11e5-9df2-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-06-29 10:47:41 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/923d2e80-1eae-11e5-8f20-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/923d2e80-1eae-11e5-8f20-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="121318" author="bzzz" created="Wed, 15 Jul 2015 06:08:10 +0000"  >&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/1bbf8b9a-2a6b-11e5-b04d-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/1bbf8b9a-2a6b-11e5-b04d-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="121533" author="bogl" created="Fri, 17 Jul 2015 14:19:36 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/d2ef2ba8-2c15-11e5-8c67-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/d2ef2ba8-2c15-11e5-8c67-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="121661" author="bzzz" created="Mon, 20 Jul 2015 12:40:30 +0000"  >&lt;p&gt;&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/f8aae4b0-2d58-11e5-831c-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/f8aae4b0-2d58-11e5-831c-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="121807" author="hdoreau" created="Tue, 21 Jul 2015 15:24:06 +0000"  >&lt;p&gt;This is not an ORR-only issue, we hit it on CRR-N too on a MDS:&lt;/p&gt;

&lt;p&gt;  #0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f4c8&amp;#93;&lt;/span&gt; machine_kexec at ffffffff8103b5bb&lt;br/&gt;
  #1 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f528&amp;#93;&lt;/span&gt; crash_kexec at ffffffff810c9c82&lt;br/&gt;
  #2 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f5f8&amp;#93;&lt;/span&gt; panic at ffffffff81529b1e&lt;br/&gt;
  #3 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f678&amp;#93;&lt;/span&gt; lbug_with_loc at ffffffffa038aedd &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #4 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f6f8&amp;#93;&lt;/span&gt; cfs_hash_findadd_unique at ffffffffa03a2db8 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f718&amp;#93;&lt;/span&gt; nrs_crrn_res_get at ffffffffa06a7a93 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f758&amp;#93;&lt;/span&gt; nrs_resource_get at ffffffffa06a1116 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f7b8&amp;#93;&lt;/span&gt; nrs_resource_get_safe at ffffffffa06a1adb &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f7f8&amp;#93;&lt;/span&gt; ptlrpc_nrs_req_hp_move at ffffffffa06a42b8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
  #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f848&amp;#93;&lt;/span&gt; ldlm_server_blocking_ast at ffffffffa0642018 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f898&amp;#93;&lt;/span&gt; ldlm_work_bl_ast_lock at ffffffffa061538d &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f918&amp;#93;&lt;/span&gt; ptlrpc_set_wait at ffffffffa065648c &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f9b8&amp;#93;&lt;/span&gt; ldlm_run_ast_work at ffffffffa061800b &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3f9e8&amp;#93;&lt;/span&gt; ldlm_process_inodebits_lock at ffffffffa0646507 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fa68&amp;#93;&lt;/span&gt; ldlm_lock_enqueue at ffffffffa06175b5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fac8&amp;#93;&lt;/span&gt; ldlm_cli_enqueue_local at ffffffffa0636b53 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fb48&amp;#93;&lt;/span&gt; mdt_object_lock0 at ffffffffa0c988f6 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fbf8&amp;#93;&lt;/span&gt; mdt_object_lock at ffffffffa0c99334 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #18 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fc08&amp;#93;&lt;/span&gt; mdt_reint_unlink at ffffffffa0cb1cce &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #19 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fc88&amp;#93;&lt;/span&gt; mdt_reint_rec at ffffffffa0cae671 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #20 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fca8&amp;#93;&lt;/span&gt; mdt_reint_internal at ffffffffa0c93cb3 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #21 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fce8&amp;#93;&lt;/span&gt; mdt_reint at ffffffffa0c93fb4 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #22 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fd08&amp;#93;&lt;/span&gt; mdt_handle_common at ffffffffa0c96aba &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #23 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fd58&amp;#93;&lt;/span&gt; mds_regular_handle at ffffffffa0cd3985 &lt;span class=&quot;error&quot;&gt;&amp;#91;mdt&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #24 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fd68&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa0670cf5 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #25 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fe48&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa067205d &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
 #26 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3fee8&amp;#93;&lt;/span&gt; kthread at ffffffff8109e66e&lt;br/&gt;
 #27 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff880ffaa3ff48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100c20a&lt;/p&gt;</comment>
                            <comment id="121812" author="bfaccini" created="Tue, 21 Jul 2015 15:44:30 +0000"  >&lt;p&gt;Hello Henri, I think the CRR-N needs the same kind of patch that Lai had pushed for ORR!&lt;br/&gt;
Lai, why did you finally decide to abandon your original patch?&lt;/p&gt;
</comment>
                            <comment id="121814" author="jay" created="Tue, 21 Jul 2015 15:50:48 +0000"  >&lt;p&gt;Bruno,&lt;/p&gt;

&lt;p&gt;That patch didn&apos;t address the problem. This looks like a memory corruption issue where most likely a piece of freed memory was accessed and written again. Later on this piece of memory was allocated and used by NRS.&lt;/p&gt;</comment>
                            <comment id="121817" author="bfaccini" created="Tue, 21 Jul 2015 16:05:18 +0000"  >&lt;p&gt;Just to be complete, one of my auto-test sessions (&lt;a href=&quot;https://testing.hpdd.intel.com/test_sessions/01e63cdc-2fa7-11e5-97d6-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sessions/01e63cdc-2fa7-11e5-97d6-5254006e85c2&lt;/a&gt;) has experienced the original LBUG/problem for this ticket, and it looks like only the whole struct nrs_orr_object that had just been (re?)allocated has been poisoned, causing the LBUG:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;
Concerned struct nrs_orr_object at 0xffff88006e3c2fa0 :
$4 = {
  oo_res = {
    res_parent = 0x5a5a5a5a5a5a5a5a, 
    res_policy = 0x5a5a5a5a5a5a5a5a
  }, 
  oo_hnode = {
    next = 0x5a5a5a5a5a5a5a5a, 
    pprev = 0x5a5a5a5a5a5a5a5a  &amp;lt;&amp;lt;&amp;lt;&amp;lt; causing the LBUG!
  }, 
  oo_round = 0x5a5a5a5a5a5a5a5a, 
  oo_sequence = 0x5a5a5a5a5a5a5a5a, 
  oo_key = {                &amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;  has just been initialized in nrs_orr_res_get()
    {
      ok_fid = {
        f_seq = 0x100000000, 
        f_oid = 0x794e, 
        f_ver = 0x0
      }, 
      ok_idx = 0x0
    }
  }, 
  oo_ref = 0x1,         &amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;&amp;lt;  has just been initialized in nrs_orr_res_get()
  oo_quantum = 0x5a5a, 
  oo_active = 0x5a5a
}

Slab containing this struct :
CACHE            NAME                 OBJSIZE  ALLOCATED     TOTAL  SLABS  SSIZE
ffff880079bb4500 nrs_orr_hp_0              80          2        48      1     4k
SLAB              MEMORY            TOTAL  ALLOCATED  FREE
ffff88006e3c2000  ffff88006e3c20f0     48          2    46
FREE / [ALLOCATED]
  [ffff88006e3c2fa0]

      PAGE       PHYSICAL      MAPPING       INDEX CNT FLAGS
ffffea000181d270 6e3c2000                0 ffff88003757ad80  1 20000000000080

Nearby memory in the same Slab, the only other region that is also poisoned:
ffff88006e3c25a0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c25b0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c25c0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c25d0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c25e0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fa0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fb0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fc0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fe0:  0000000000000001 5a5a5a5a5a5a5a5a   ........ZZZZZZZZ

Where:
CACHE            NAME                 OBJSIZE  ALLOCATED     TOTAL  SLABS  SSIZE
ffff880079bb4500 nrs_orr_hp_0              80          2        48      1     4k
SLAB              MEMORY            TOTAL  ALLOCATED  FREE
ffff88006e3c2000  ffff88006e3c20f0     48          2    46
FREE / [ALLOCATED]
   ffff88006e3c25a0  (cpu 0 cache)

      PAGE       PHYSICAL      MAPPING       INDEX CNT FLAGS
ffffea000181d270 6e3c2000                0 ffff88003757ad80  1 20000000000080

So only one other free nrs_orr_object in the same Slab and the one just allocated (which caused the LBUG) are poisoned!!
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="121840" author="bfaccini" created="Tue, 21 Jul 2015 16:42:02 +0000"  >&lt;p&gt;Hello Jinshan, I agree that this is confusing and looks like a corruption, but if you have a look at my crash-dump extracts, it would have to have been a very precise one!! By the way, even the end of the Slab, right after the concerned nrs_orr_object, has been preserved:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;ffff88006e3c2f60:  0000000000000000 0000000000000000   ................
ffff88006e3c2f70:  0000000000000000 0000000000000000   ................
ffff88006e3c2f80:  0000000000000000 0000000000000000   ................
ffff88006e3c2f90:  0000000000000000 0000000000000000   ................
ffff88006e3c2fa0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fb0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fc0:  5a5a5a5a5a5a5a5a 5a5a5a5a5a5a5a5a   ZZZZZZZZZZZZZZZZ
ffff88006e3c2fd0:  0000000100000000 000000000000794e   ........Ny......
ffff88006e3c2fe0:  0000000000000001 5a5a5a5a5a5a5a5a   ........ZZZZZZZZ
ffff88006e3c2ff0:  0000000000000000 0000000001a87067   ........gp......
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="122001" author="jamesanunez" created="Thu, 23 Jul 2015 14:54:08 +0000"  >&lt;p&gt;Another case:&lt;br/&gt;
2015-07-22 13:58:00 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/e15f2588-30bd-11e5-ae23-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/e15f2588-30bd-11e5-ae23-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="122344" author="bogl" created="Mon, 27 Jul 2015 23:01:05 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/ff5a31b8-308b-11e5-aa87-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/ff5a31b8-308b-11e5-aa87-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="122544" author="jamesanunez" created="Wed, 29 Jul 2015 14:38:16 +0000"  >&lt;p&gt;More from master review-zfs-part-1:&lt;br/&gt;
2015-07-28 20:20:41 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/7b300648-35a3-11e5-b949-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/7b300648-35a3-11e5-b949-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-07-28 22:07:39 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/8927e85c-35ac-11e5-bbc3-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/8927e85c-35ac-11e5-bbc3-5254006e85c2&lt;/a&gt;&lt;br/&gt;
2015-07-29 04:24:48 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/c3dfd67e-35e5-11e5-8c30-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/c3dfd67e-35e5-11e5-8c30-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="122940" author="bogl" created="Sat, 1 Aug 2015 21:21:19 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/5bfd264e-3886-11e5-9969-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/5bfd264e-3886-11e5-9969-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="122948" author="bogl" created="Sun, 2 Aug 2015 19:35:10 +0000"  >&lt;p&gt;another on master:&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/b9aec8d4-38ee-11e5-8dec-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/b9aec8d4-38ee-11e5-8dec-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="123401" author="di.wang" created="Wed, 5 Aug 2015 20:45:39 +0000"  >&lt;p&gt;hit again&lt;br/&gt;
&lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/c6cd44f2-3b53-11e5-95fa-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/c6cd44f2-3b53-11e5-95fa-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="123474" author="jay" created="Thu, 6 Aug 2015 16:50:57 +0000"  >&lt;p&gt;I made a patch at: &lt;a href=&quot;http://review.whamcloud.com/15670&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/15670&lt;/a&gt; to reproduce it with MALLOC debug flag set.&lt;/p&gt;</comment>
                            <comment id="123778" author="jay" created="Mon, 10 Aug 2015 19:40:30 +0000"  >&lt;p&gt;I&apos;m working on this issue.&lt;/p&gt;</comment>
                            <comment id="123815" author="gerrit" created="Tue, 11 Aug 2015 03:47:22 +0000"  >&lt;p&gt;Jinshan Xiong (jinshan.xiong@intel.com) uploaded a new patch: &lt;a href=&quot;http://review.whamcloud.com/15943&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/15943&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4499&quot; title=&quot;NRS ORR cfs_hash_find_or_add() LBUG&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4499&quot;&gt;&lt;del&gt;LU-4499&lt;/del&gt;&lt;/a&gt; nrs: adjust the order of REQ NRS initilization&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: 1&lt;br/&gt;
Commit: 263a722ce77cac0fe55f316c100e83b92b451064&lt;/p&gt;</comment>
                            <comment id="124954" author="jamesanunez" created="Mon, 24 Aug 2015 20:24:47 +0000"  >&lt;p&gt;We hit this bug again:&lt;br/&gt;
2015-08-21 10:39:47 - &lt;a href=&quot;https://testing.hpdd.intel.com/test_sets/3147f89a-4829-11e5-8db5-5254006e85c2&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://testing.hpdd.intel.com/test_sets/3147f89a-4829-11e5-8db5-5254006e85c2&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="125193" author="gerrit" created="Wed, 26 Aug 2015 15:32:34 +0000"  >&lt;p&gt;Oleg Drokin (oleg.drokin@intel.com) merged in patch &lt;a href=&quot;http://review.whamcloud.com/15943/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/15943/&lt;/a&gt;&lt;br/&gt;
Subject: &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4499&quot; title=&quot;NRS ORR cfs_hash_find_or_add() LBUG&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4499&quot;&gt;&lt;del&gt;LU-4499&lt;/del&gt;&lt;/a&gt; nrs: adjust the order of REQ NRS initilization&lt;br/&gt;
Project: fs/lustre-release&lt;br/&gt;
Branch: master&lt;br/&gt;
Current Patch Set: &lt;br/&gt;
Commit: f904a6617b57eb8b4b90f5bc198bdec758133922&lt;/p&gt;</comment>
                            <comment id="125223" author="jgmitter" created="Wed, 26 Aug 2015 17:40:05 +0000"  >&lt;p&gt;Landed for 2.8.&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10010">
                    <name>Duplicate</name>
                                                                <inwardlinks description="is duplicated by">
                                        <issuelink>
            <issuekey id="30348">LU-6633</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                                        </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="31849">LU-7084</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="30521">LU-6688</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwcyv:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>12304</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>