<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:29:50 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-2970] ASSERTION( !list_empty(&amp;h-&gt;loh_layers) ) failed, followed by a kernel panic</title>
                <link>https://jira.whamcloud.com/browse/LU-2970</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;One of our lustre clients crashed yesterday with the following kernel panic:&lt;/p&gt;

&lt;p&gt;2013-03-14T16:24:25+01:00 brutus3 LustreError: 4488:0:(lu_object.h:759:lu_object_top()) ASSERTION( !list_empty(&amp;amp;h-&amp;gt;loh_layers) ) failed: &lt;br/&gt;
2013-03-14T16:24:25+01:00 brutus3 general protection fault: 0000 &lt;a href=&quot;#1&quot; target=&quot;_blank&quot; rel=&quot;noopener&quot;&gt;1&lt;/a&gt; SMP &lt;br/&gt;
2013-03-14T16:24:25+01:00 brutus3 last sysfs file: /sys/devices/system/cpu/cpu47/cache/index2/shared_cpu_map&lt;br/&gt;
2013-03-14T16:24:25+01:00 brutus3 CPU 28 &lt;br/&gt;
2013-03-14T16:24:25+01:00 brutus3 Modules linked in: lmv(U) mgc(U) lustre(U) lov(U) osc(U) mdc(U) fid(U) fld(U) ko2iblnd(U) ptlrpc(U) obdclass(U) lvfs(U) lnet(U) sha512_generic sha256_generic libcfs(U) netconsole configfs panfs(P)(U) autofs4 nfs fscache nfs_acl auth_rpcg&lt;br/&gt;
ss lockd sunrpc bonding 8021q garp stp llc nf_conntrack_ipv4 nf_defrag_ipv4 xt_state nf_conntrack iptable_filter ip_tables ib_ipoib rdma_ucm ib_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_addr ipv6 ib_sa mlx4_ib ib_mad ib_core mlx4_en mlx4_core power_meter sg hpilo hpwd&lt;br/&gt;
t netxen_nic microcode serio_raw k10temp amd64_edac_mod edac_core edac_mce_amd i2c_piix4 shpchp ext4 mbcache jbd2 sd_mod crc_t10dif hpsa ata_generic pata_acpi pata_atiixp ahci radeon ttm drm_kms_helper drm i2c_algo_bit i2c_core dm_mirror dm_region_hash dm_log dm_mod [las&lt;br/&gt;
t unloaded: scsi_wait_scan]&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 &lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 Pid: 9597, comm: ldlm_bl_101 Tainted: P           ---------------    2.6.32-279.22.1.el6.x86_64 #1 HP ProLiant DL585 G7&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 RIP: 0010:&lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d128cb&amp;gt;&amp;#93;&lt;/span&gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d128cb&amp;gt;&amp;#93;&lt;/span&gt; cl_object_top+0x1b/0x150 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 RSP: 0018:ffff880551501ba0  EFLAGS: 00010206&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 RAX: 5a5a5a5a5a5a5a5a RBX: ffff880b44368400 RCX: ffff8801824afe08&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 RDX: 5a5a5a5a5a5a5a5a RSI: ffffffffa10dd860 RDI: ffff880388e153c8&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 RBP: ffff880551501bb0 R08: 0000000000000000 R09: 0000000000000000&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 R10: 0000000000000000 R11: 0000000000000000 R12: ffff88099c331e00&lt;br/&gt;
2013-03-14T16:24:26+01:00 brutus3 R13: ffff8812ee62b290 R14: ffff880388e153c8 R15: ffff8811ca34ebc8&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 FS:  00007f248980f700(0000) GS:ffff88044e440000(0000) knlGS:0000000008ec3830&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 CR2: 00000000006d3a30 CR3: 0000001835b46000 CR4: 00000000000006e0&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 Process ldlm_bl_101 (pid: 9597, threadinfo ffff880551500000, task ffff8808351d6040)&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 Stack:&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 ffff880551501bc0 ffff880b44368400 ffff880551501bc0 ffffffffa0d12a2e&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 syslog-ng&lt;span class=&quot;error&quot;&gt;&amp;#91;2221&amp;#93;&lt;/span&gt;: Error processing log message: &amp;lt;d&amp;gt; ffff880551501c00 ffffffffa10b3b24 0000000000000000 ffff8812ee62b290&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 syslog-ng&lt;span class=&quot;error&quot;&gt;&amp;#91;2221&amp;#93;&lt;/span&gt;: Error processing log message: &amp;lt;d&amp;gt; ffff8812ee62b290 ffff88099c331e00 ffff88099c331e00 ffff880551501cb0&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 Call Trace:&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d12a2e&amp;gt;&amp;#93;&lt;/span&gt; cl_object_attr_lock+0xe/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3b24&amp;gt;&amp;#93;&lt;/span&gt; osc_lock_detach+0xf4/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3c08&amp;gt;&amp;#93;&lt;/span&gt; osc_lock_delete+0x48/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:27+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1ab65&amp;gt;&amp;#93;&lt;/span&gt; cl_lock_delete0+0xb5/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1add3&amp;gt;&amp;#93;&lt;/span&gt; cl_lock_delete+0x153/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b5846&amp;gt;&amp;#93;&lt;/span&gt; osc_ldlm_blocking_ast+0x146/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e33f2c&amp;gt;&amp;#93;&lt;/span&gt; ldlm_cancel_callback+0x6c/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e42dda&amp;gt;&amp;#93;&lt;/span&gt; ldlm_cli_cancel_local+0x8a/0x470 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e478db&amp;gt;&amp;#93;&lt;/span&gt; ldlm_cli_cancel+0x5b/0x360 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b4259&amp;gt;&amp;#93;&lt;/span&gt; osc_lock_cancel+0xf9/0x1c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1392d&amp;gt;&amp;#93;&lt;/span&gt; ? cl_env_nested_get+0x5d/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d19645&amp;gt;&amp;#93;&lt;/span&gt; cl_lock_cancel0+0x75/0x160 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1a1eb&amp;gt;&amp;#93;&lt;/span&gt; cl_lock_cancel+0x13b/0x140 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b583a&amp;gt;&amp;#93;&lt;/span&gt; osc_ldlm_blocking_ast+0x13a/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b070&amp;gt;&amp;#93;&lt;/span&gt; ldlm_handle_bl_callback+0x130/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b5c1&amp;gt;&amp;#93;&lt;/span&gt; ldlm_bl_thread_main+0x281/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:28+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105fa40&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0ca&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0c0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 Code: c7 80 1f d6 a0 e8 a6 25 e9 ff 66 0f 1f 44 00 00 55 48 89 e5 53 48 83 ec 08 0f 1f 44 00 00 48 8b 07 0f 1f 80 00 00 00 00 48 89 c2 &amp;lt;48&amp;gt; 8b 80 88 00 00 00 48 85 c0 75 f1 48 8b 42 48 48 83 c2 48 48 &lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 RIP  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d128cb&amp;gt;&amp;#93;&lt;/span&gt; cl_object_top+0x1b/0x150 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 RSP &amp;lt;ffff880551501ba0&amp;gt;&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 --&lt;del&gt;[ end trace 4537c3429b809b37 ]&lt;/del&gt;--&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 Kernel panic - not syncing: Fatal exception&lt;br/&gt;
2013-03-14T16:24:29+01:00 brutus3 Pid: 9597, comm: ldlm_bl_101 Tainted: P      D    ---------------    2.6.32-279.22.1.el6.x86_64 #1&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 Call Trace:&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814e9903&amp;gt;&amp;#93;&lt;/span&gt; ? panic+0xa0/0x168&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814eda94&amp;gt;&amp;#93;&lt;/span&gt; ? oops_end+0xe4/0x100&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100f19b&amp;gt;&amp;#93;&lt;/span&gt; ? die+0x5b/0x90&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ed602&amp;gt;&amp;#93;&lt;/span&gt; ? do_general_protection+0x152/0x160&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ecdd5&amp;gt;&amp;#93;&lt;/span&gt; ? general_protection+0x25/0x30&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d128cb&amp;gt;&amp;#93;&lt;/span&gt; ? cl_object_top+0x1b/0x150 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d12a2e&amp;gt;&amp;#93;&lt;/span&gt; ? cl_object_attr_lock+0xe/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3b24&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_detach+0xf4/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3c08&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_delete+0x48/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1ab65&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_delete0+0xb5/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1add3&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_delete+0x153/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b5846&amp;gt;&amp;#93;&lt;/span&gt; ? osc_ldlm_blocking_ast+0x146/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:30+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e33f2c&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cancel_callback+0x6c/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e42dda&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cli_cancel_local+0x8a/0x470 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e478db&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cli_cancel+0x5b/0x360 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b4259&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_cancel+0xf9/0x1c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1392d&amp;gt;&amp;#93;&lt;/span&gt; ? cl_env_nested_get+0x5d/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d19645&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_cancel0+0x75/0x160 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1a1eb&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_cancel+0x13b/0x140 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b583a&amp;gt;&amp;#93;&lt;/span&gt; ? osc_ldlm_blocking_ast+0x13a/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b070&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_handle_bl_callback+0x130/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b5c1&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x281/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105fa40&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:31+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0ca&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0xa/0x20&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0c0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 -----------&lt;del&gt;[ cut here ]&lt;/del&gt;-----------&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 WARNING: at arch/x86/kernel/smp.c:117 native_smp_send_reschedule+0x5c/0x60() (Tainted: P      D    ---------------   )&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 Hardware name: ProLiant DL585 G7&lt;br/&gt;
2013-03-14T16:24:32+01:00 brutus3 Modules linked in: lmv(U) mgc(U) lustre(U) lov(U) osc(U) mdc(U) fid(U) fld(U) ko2iblnd(U) ptlrpc(U) obdclass(U) lvfs(U) lnet(U) sha512_generic sha256_generic libcfs(U) netconsole configfs panfs(P)(U) autofs4 nfs fscache nfs_acl auth_rpcgss lockd sunrpc bonding 8021q garp stp llc nf_conntrack_ipv4 nf_defrag_ipv4 xt_state nf_conntrack iptable_filter ip_tables ib_ipoib rdma_ucm ib_ucm ib_uverbs ib_umad rdma_cm ib_cm iw_cm ib_addr ipv6 ib_sa mlx4_ib ib_mad ib_core mlx4_en mlx4_core power_meter sg hpilo hpwdt netxen_nic microcode serio_raw k10temp amd64_edac_mod edac_core edac_mce_amd i2c_piix4 shpchp ext4 mbcache jbd2 sd_mod crc_t10dif hpsa ata_generic pata_acpi pata_atiixp ahci radeon ttm drm_kms_helper drm i2c_algo_bit i2c_core dm_mirror dm_region_hash dm_log dm_mod &lt;span class=&quot;error&quot;&gt;&amp;#91;last unloaded: scsi_wait_scan&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 Pid: 9597, comm: ldlm_bl_101 Tainted: P      D    ---------------    2.6.32-279.22.1.el6.x86_64 #1&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 Call Trace:&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 &amp;lt;IRQ&amp;gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8106a2a7&amp;gt;&amp;#93;&lt;/span&gt; ? warn_slowpath_common+0x87/0xc0&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8106a2fa&amp;gt;&amp;#93;&lt;/span&gt; ? warn_slowpath_null+0x1a/0x20&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8102a26c&amp;gt;&amp;#93;&lt;/span&gt; ? native_smp_send_reschedule+0x5c/0x60&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e048&amp;gt;&amp;#93;&lt;/span&gt; ? resched_task+0x68/0x80&lt;br/&gt;
2013-03-14T16:24:33+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81053a60&amp;gt;&amp;#93;&lt;/span&gt; ? check_preempt_wakeup+0x1c0/0x260&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8106210b&amp;gt;&amp;#93;&lt;/span&gt; ? enqueue_task_fair+0xfb/0x100&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e0fc&amp;gt;&amp;#93;&lt;/span&gt; ? check_preempt_curr+0x7c/0x90&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105f873&amp;gt;&amp;#93;&lt;/span&gt; ? try_to_wake_up+0x213/0x3e0&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81094d40&amp;gt;&amp;#93;&lt;/span&gt; ? hrtimer_wakeup+0x0/0x30&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105fa95&amp;gt;&amp;#93;&lt;/span&gt; ? wake_up_process+0x15/0x20&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81094d62&amp;gt;&amp;#93;&lt;/span&gt; ? hrtimer_wakeup+0x22/0x30&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8109535e&amp;gt;&amp;#93;&lt;/span&gt; ? __run_hrtimer+0x8e/0x1a0&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81012a69&amp;gt;&amp;#93;&lt;/span&gt; ? read_tsc+0x9/0x20&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81095706&amp;gt;&amp;#93;&lt;/span&gt; ? hrtimer_interrupt+0xe6/0x250&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814f235b&amp;gt;&amp;#93;&lt;/span&gt; ? smp_apic_timer_interrupt+0x6b/0x9b&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100bb93&amp;gt;&amp;#93;&lt;/span&gt; ? apic_timer_interrupt+0x13/0x20&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &amp;lt;EOI&amp;gt;  &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81274465&amp;gt;&amp;#93;&lt;/span&gt; ? delay_tsc+0x45/0x80&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81274447&amp;gt;&amp;#93;&lt;/span&gt; ? delay_tsc+0x27/0x80&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81274416&amp;gt;&amp;#93;&lt;/span&gt; ? __const_udelay+0x46/0x50&lt;br/&gt;
2013-03-14T16:24:34+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8102a3e3&amp;gt;&amp;#93;&lt;/span&gt; ? native_stop_other_cpus+0x83/0xd0&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814e9919&amp;gt;&amp;#93;&lt;/span&gt; ? panic+0xb6/0x168&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814eda94&amp;gt;&amp;#93;&lt;/span&gt; ? oops_end+0xe4/0x100&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100f19b&amp;gt;&amp;#93;&lt;/span&gt; ? die+0x5b/0x90&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ed602&amp;gt;&amp;#93;&lt;/span&gt; ? do_general_protection+0x152/0x160&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff814ecdd5&amp;gt;&amp;#93;&lt;/span&gt; ? general_protection+0x25/0x30&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d128cb&amp;gt;&amp;#93;&lt;/span&gt; ? cl_object_top+0x1b/0x150 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d12a2e&amp;gt;&amp;#93;&lt;/span&gt; ? cl_object_attr_lock+0xe/0x20 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3b24&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_detach+0xf4/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b3c08&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_delete+0x48/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1ab65&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_delete0+0xb5/0x1d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1add3&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_delete+0x153/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b5846&amp;gt;&amp;#93;&lt;/span&gt; ? osc_ldlm_blocking_ast+0x146/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:35+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e33f2c&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cancel_callback+0x6c/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e42dda&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cli_cancel_local+0x8a/0x470 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e478db&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_cli_cancel+0x5b/0x360 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b4259&amp;gt;&amp;#93;&lt;/span&gt; ? osc_lock_cancel+0xf9/0x1c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1392d&amp;gt;&amp;#93;&lt;/span&gt; ? cl_env_nested_get+0x5d/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d19645&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_cancel0+0x75/0x160 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0d1a1eb&amp;gt;&amp;#93;&lt;/span&gt; ? cl_lock_cancel+0x13b/0x140 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa10b583a&amp;gt;&amp;#93;&lt;/span&gt; ? osc_ldlm_blocking_ast+0x13a/0x350 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b070&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_handle_bl_callback+0x130/0x400 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b5c1&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x281/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105fa40&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:36+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0ca&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0xa/0x20&lt;br/&gt;
2013-03-14T16:24:37+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:37+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0e4b340&amp;gt;&amp;#93;&lt;/span&gt; ? ldlm_bl_thread_main+0x0/0x3d0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2013-03-14T16:24:37+01:00 brutus3 &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100c0c0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
2013-03-14T16:24:37+01:00 brutus3 --&lt;del&gt;[ end trace 4537c3429b809b38 ]&lt;/del&gt;--&lt;br/&gt;
2013-03-14T16:24:37+01:00 brutus3 panic occurred, switching back to text console&lt;/p&gt;


&lt;p&gt;Unfortunately, I have no idea which process caused the panic: the affected node is a login node and there were about 50 people logged in, so I have no easy way to reproduce the crash :-/&lt;/p&gt;

&lt;p&gt;The lustre kernel module was compiled from the v2_3_61_0 git tag.&lt;/p&gt;
</description>
                <environment>CentOS 6.3 (kernel 2.6.32-279.22.1.el6.x86_64)&lt;br/&gt;
Lustre Client: v2_3_61_0 (git version)</environment>
        <key id="17908">LU-2970</key>
            <summary>ASSERTION( !list_empty(&amp;h-&gt;loh_layers) ) failed, followed by a kernel panic</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="ethz.support">ETHz Support</reporter>
                        <labels>
                            <label>LB</label>
                    </labels>
                <created>Fri, 15 Mar 2013 05:40:00 +0000</created>
                <updated>Thu, 28 Mar 2013 14:35:19 +0000</updated>
                            <resolved>Thu, 28 Mar 2013 14:35:19 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                                    <fixVersion>Lustre 2.4.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>5</watches>
                                                                            <comments>
                            <comment id="54220" author="pjones" created="Sun, 17 Mar 2013 15:33:20 +0000"  >&lt;p&gt;Adrian&lt;/p&gt;

&lt;p&gt;Do I understand correctly that you are running a pre-release version of 2.4 in production? &lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="54221" author="adrian" created="Sun, 17 Mar 2013 16:58:59 +0000"  >&lt;p&gt;Yes, our compute nodes/clients are running git-versions of the lustre client (The servers are running stock 2.2.0 - we will upgrade them to 2.4.0 after the release)&lt;/p&gt;

&lt;p&gt;I am aware of the fact that this might not be a good idea (well, someone has to test it &lt;img class=&quot;emoticon&quot; src=&quot;https://jira.whamcloud.com/images/icons/emoticons/wink.png&quot; height=&quot;16&quot; width=&quot;16&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;) - but the 2_3 git releases turned out to be MUCH more stable than the official 2.2 and 2.3 client releases. Our users managed to crash 2.2 client nodes multiple times per day - with 2.3 we still had about 5-6 kernel panics per week while we are down to ~1 panic per week with the current GIT version.&lt;/p&gt;</comment>
                            <comment id="54222" author="pjones" created="Sun, 17 Mar 2013 17:19:24 +0000"  >&lt;p&gt;Adrian&lt;/p&gt;

&lt;p&gt;As long as you are aware of the risks of running pre-release software then of course I am delighted that we are able to get feedback from a real production environment - 2.4 will be a better release for it. &lt;/p&gt;

&lt;p&gt;While the focus of feature releases is always the new features provided, we also include all known bugfixes and the vast majority of the issues exposed by sites running 2.x releases have been issues in the underlying 2.0 code that we have built upon, rather than regressions associated with the new features. So, while I am disappointed to hear that you have had poor stability with 2.2 and 2.3 (others have reported a far better experience), I am not surprised to hear that things have been improving.&lt;/p&gt;

&lt;p&gt;Do you mind if I mention publicly (on updates to the mailing lists, in presentations about Lustre 2.4) that ETHZ is doing this?&lt;/p&gt;

&lt;p&gt;Oleg&lt;/p&gt;

&lt;p&gt;Could you please review this report and advise next steps? Is there enough to work with here? If not, can you advise what Adrian should collect in the event of a future recurrence?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="54223" author="adrian" created="Sun, 17 Mar 2013 18:57:57 +0000"  >&lt;p&gt;&amp;gt; Do you mind if I mention publicly (on updates to the mailing lists, in presentations about Lustre 2.4) that ETHZ is doing this?&lt;/p&gt;

&lt;p&gt;I don&apos;t mind: That&apos;s fine with me.&lt;/p&gt;</comment>
                            <comment id="54224" author="pjones" created="Sun, 17 Mar 2013 19:01:31 +0000"  >&lt;p&gt;Great - thanks Adrian!&lt;/p&gt;</comment>
                            <comment id="54290" author="adilger" created="Mon, 18 Mar 2013 19:00:38 +0000"  >&lt;p&gt;Jinshan, can you please take a look at this to see if anything is obvious?&lt;/p&gt;</comment>
                            <comment id="54293" author="jay" created="Mon, 18 Mar 2013 19:18:49 +0000"  >&lt;p&gt;Obviously the object was already freed when this issue happened. Hmm.. did you set up crashdump on the machine or it&apos;s impossible to collect lustre log?&lt;/p&gt;</comment>
                            <comment id="54388" author="green" created="Tue, 19 Mar 2013 16:56:49 +0000"  >&lt;p&gt;I hit a very similar bug last Sunday. have crashdump in /exports/crashdumps/192.168.10.218-2013-03-17-21\:29\:49/&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;[363112.577950] general protection fault: 0000 [#1] SMP DEBUG_PAGEALLOC
[363112.578318] last sysfs file: /sys/devices/system/cpu/possible
[363112.578589] CPU 1
[363112.578637] Modules linked in: lustre ofd osp lod ost mdt osd_ldiskfs fsfilt_
ldiskfs ldiskfs mdd mgs lquota obdecho mgc lov osc mdc lmv fid fld ptlrpc obdclas
s lvfs ksocklnd lnet libcfs exportfs jbd sha512_generic sha256_generic ext4 mbcac
he jbd2 virtio_balloon virtio_console i2c_piix4 i2c_core virtio_blk virtio_net vi
rtio_pci virtio_ring virtio pata_acpi ata_generic ata_piix dm_mirror dm_region_ha
sh dm_log dm_mod nfs lockd fscache nfs_acl auth_rpcgss sunrpc be2iscsi bnx2i cnic
 uio ipv6 cxgb3i libcxgbi cxgb3 mdio libiscsi_tcp qla4xxx iscsi_boot_sysfs libisc
si scsi_transport_iscsi [last unloaded: libcfs]
[363112.580600]
[363112.580600] Pid: 451, comm: ldlm_bl_45 Not tainted 2.6.32-debug #6 Bochs Boch
s
[363112.580600] RIP: 0010:[&amp;lt;ffffffffa0f9c90b&amp;gt;]  [&amp;lt;ffffffffa0f9c90b&amp;gt;] cl_object_to
p+0x1b/0x150 [obdclass]
[363112.580600] RSP: 0018:ffff88009e0edb90  EFLAGS: 00010206
[363112.580600] RAX: 000130b38d4c0000 RBX: ffff88000bfb1db0 RCX: ffff880080abef60
[363112.580600] RDX: 000130b38d4c0000 RSI: ffffffffa04b1940 RDI: ffff88004ee8deb0
[363112.580600] RBP: ffff88009e0edba0 R08: 0000000000000000 R09: 0000000000000000
[363112.580600] R10: 0000000000000003 R11: 000000000000000f R12: ffff8800a89e6f30
[363112.580600] R13: ffff88003e04df50 R14: ffff88004ee8deb0 R15: ffff8800790bbc18
[363112.580600] FS:  00007f8c05205700(0000) GS:ffff880006280000(0000) knlGS:0000000000000000
[363112.580600] CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
[363112.580600] CR2: 00007ff2a83e2cf6 CR3: 0000000072edd000 CR4: 00000000000006e0
[363112.580600] DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
[363112.580600] DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
[363112.587593] Process ldlm_bl_45 (pid: 451, threadinfo ffff88009e0ec000, task ffff880088694440)
[363112.587593] Stack:
[363112.587593]  ffff88009e0edbb0 ffff88000bfb1db0 ffff88009e0edbb0 ffffffffa0f9ca4e
[363112.587593] &amp;lt;d&amp;gt; ffff88009e0edbf0 ffffffffa0488788 0000000000000002 ffff88003e04df50 
[363112.587593] &amp;lt;d&amp;gt; ffff88003e04df50 ffff8800a89e6f30 ffff8800a89e6f30 ffff88009e0edca0 
[363112.587593] Call Trace:
[363112.587593]  [&amp;lt;ffffffffa0f9ca4e&amp;gt;] cl_object_attr_lock+0xe/0x20 [obdclass]
[363112.587593]  [&amp;lt;ffffffffa0488788&amp;gt;] osc_lock_detach+0xe8/0x1a0 [osc]
[363112.587593]  [&amp;lt;ffffffffa0488888&amp;gt;] osc_lock_delete+0x48/0xc0 [osc]
[363112.587593]  [&amp;lt;ffffffffa0fa4ce5&amp;gt;] cl_lock_delete0+0xb5/0x1d0 [obdclass]
[363112.587593]  [&amp;lt;ffffffffa0fa4f53&amp;gt;] cl_lock_delete+0x153/0x1a0 [obdclass]
[363112.587593]  [&amp;lt;ffffffffa048a4f6&amp;gt;] osc_ldlm_blocking_ast+0x146/0x350 [osc]
[363112.587593]  [&amp;lt;ffffffffa10c906c&amp;gt;] ldlm_cancel_callback+0x6c/0x1a0 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffffa10e30da&amp;gt;] ldlm_cli_cancel_local+0x8a/0x470 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffffa10e7bd0&amp;gt;] ldlm_cli_cancel+0x60/0x360 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffffa0488ede&amp;gt;] osc_lock_cancel+0xfe/0x1c0 [osc]
[363112.587593]  [&amp;lt;ffffffffa0fa37c5&amp;gt;] cl_lock_cancel0+0x75/0x160 [obdclass]
[363112.587593]  [&amp;lt;ffffffffa0fa436b&amp;gt;] cl_lock_cancel+0x13b/0x140 [obdclass]
[363112.587593]  [&amp;lt;ffffffffa048a4ea&amp;gt;] osc_ldlm_blocking_ast+0x13a/0x350 [osc]
[363112.587593]  [&amp;lt;ffffffffa10eb970&amp;gt;] ldlm_handle_bl_callback+0x130/0x400 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffffa10ebec9&amp;gt;] ldlm_bl_thread_main+0x289/0x3e0 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffff81057d60&amp;gt;] ? default_wake_function+0x0/0x20
[363112.587593]  [&amp;lt;ffffffffa10ebc40&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffff8100c14a&amp;gt;] child_rip+0xa/0x20
[363112.587593]  [&amp;lt;ffffffffa10ebc40&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffffa10ebc40&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3e0 [ptlrpc]
[363112.587593]  [&amp;lt;ffffffff8100c140&amp;gt;] ? child_rip+0x0/0x20
[363112.587593] Code: c7 a0 e2 fe a0 e8 e6 95 e9 ff 66 0f 1f 44 00 00 55 48 89 e5 53 48 83 ec 08 0f 1f 44 00 00 48 8b 07 0f 1f 80 00 00 00 00 48 89 c2 &amp;lt;48&amp;gt; 8b 80 b0 00 00 00 48 85 c0 75 f1 48 8b 42 48 48 83 c2 48 48
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="54391" author="green" created="Tue, 19 Mar 2013 17:02:50 +0000"  >&lt;p&gt;Adrian, with panics once per week, any other interesting panics you happen to have that you can share with us?&lt;/p&gt;</comment>
                            <comment id="54447" author="adrian" created="Wed, 20 Mar 2013 07:51:46 +0000"  >&lt;p&gt;@ Jinshan Xiong&lt;br/&gt;
&amp;gt; Hmm.. did you set up crashdump on the machine or it&apos;s impossible to collect lustre log?&lt;/p&gt;

&lt;p&gt;Unfortunately, crashdump was not enabled on this kind of node. It is now enabled and i should be able to provide a crashdump if it happens again&lt;/p&gt;

&lt;p&gt;@ Oleg Drokin&lt;br/&gt;
&amp;gt; Adrian, with panics once per week, any other interesting panics you happen to have that you can share with us?&lt;/p&gt;

&lt;p&gt;No, i don&apos;t have any other interesting panics right now &lt;img class=&quot;emoticon&quot; src=&quot;https://jira.whamcloud.com/images/icons/emoticons/smile.png&quot; height=&quot;16&quot; width=&quot;16&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;br/&gt;
All other &apos;recent&apos; crashes happened on nodes with some older version of the lustre client (and in most cases it was already fixed in the -git version).&lt;br/&gt;
This was our first crash with 2_3_61&lt;/p&gt;</comment>
                            <comment id="54489" author="jay" created="Wed, 20 Mar 2013 17:22:57 +0000"  >&lt;p&gt;Hi Adrian, I&apos;m going to work out a debug patch. From the symptom so far, the top object was freed while a sublock was still being canceled. This must be a race, but I need more information.&lt;/p&gt;</comment>
                            <comment id="54535" author="jay" created="Thu, 21 Mar 2013 06:07:39 +0000"  >&lt;p&gt;I&apos;ve found the root cause of this problem; I will compose a patch.&lt;/p&gt;</comment>
                            <comment id="54676" author="jay" created="Fri, 22 Mar 2013 17:33:56 +0000"  >&lt;p&gt;patch is at: &lt;a href=&quot;http://review.whamcloud.com/5812&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/5812&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="54744" author="adrian" created="Mon, 25 Mar 2013 10:01:12 +0000"  >&lt;p&gt;Thanks! I&apos;ll rebuild our client-RPM with the patch included ASAP.&lt;/p&gt;</comment>
                            <comment id="55005" author="pjones" created="Thu, 28 Mar 2013 14:35:19 +0000"  >&lt;p&gt;Landed for 2.4&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvlfz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>7239</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>