<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:04:43 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-195] OSS nodes hung due to multiple threads spinning on dq_list_lock with Lustre quotas enabled</title>
                <link>https://jira.whamcloud.com/browse/LU-195</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;At CEA they sometimes have multiple OSS nodes completely hang. Those nodes are dead and need to be crashed.&lt;/p&gt;

&lt;p&gt;In the dump, they see that multiple tasks are spinning on &quot;dq_list_lock&quot; with the following stack traces:&lt;br/&gt;
============================================================================&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859180&amp;#93;&lt;/span&gt; _spin_lock at ffffffff81454fee&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859188&amp;#93;&lt;/span&gt; dqget at ffffffff811b0914&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf8591d8&amp;#93;&lt;/span&gt; vfs_get_dqblk at ffffffff811b0f5a&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf8591f8&amp;#93;&lt;/span&gt; fsfilt_ldiskfs_quotactl at ffffffffa03fcbff&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf8592a8&amp;#93;&lt;/span&gt; compute_remquota at ffffffffa07cb7ce&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859328&amp;#93;&lt;/span&gt; quota_check_common at ffffffffa07d4ade&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859468&amp;#93;&lt;/span&gt; quota_chk_acq_common at ffffffffa07d5561&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf8595e8&amp;#93;&lt;/span&gt; filter_commitrw_write at ffffffffa0797488&lt;br/&gt;
#15 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf8597d8&amp;#93;&lt;/span&gt; filter_commitrw at ffffffffa078a535&lt;br/&gt;
#16 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859898&amp;#93;&lt;/span&gt; obd_commitrw at ffffffffa0655ffa&lt;br/&gt;
#17 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859918&amp;#93;&lt;/span&gt; ost_brw_write at ffffffffa065e644&lt;br/&gt;
#18 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859af8&amp;#93;&lt;/span&gt; ost_handle at ffffffffa066337a&lt;br/&gt;
#19 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859ca8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa06c5b11&lt;br/&gt;
#20 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859de8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa06c6f0a&lt;br/&gt;
#21 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8805cf859f48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100d1aa&lt;/p&gt;

&lt;p&gt;and &lt;/p&gt;

&lt;p&gt; #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e59817d0&amp;#93;&lt;/span&gt; _spin_lock at ffffffff81454fee&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e59817d8&amp;#93;&lt;/span&gt; dqget at ffffffff811b0914&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981828&amp;#93;&lt;/span&gt; dquot_initialize at ffffffff811b1077&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981898&amp;#93;&lt;/span&gt; filter_destroy at ffffffffa0779496&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981a78&amp;#93;&lt;/span&gt; ost_destroy at ffffffffa0656de3&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981af8&amp;#93;&lt;/span&gt; ost_handle at ffffffffa066252b&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981ca8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa06c5b11&lt;br/&gt;
#13 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981de8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa06c6f0a&lt;br/&gt;
#14 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff8804e5981f48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100d1aa&lt;br/&gt;
============================================================================&lt;/p&gt;


&lt;p&gt;while the task that owns the &quot;dq_list_lock&quot; is spinning forever with the following stack trace:&lt;br/&gt;
============================================================================&lt;br/&gt;
 #6 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdeb8c0&amp;#93;&lt;/span&gt; vfs_quota_sync at ffffffff811b128b&lt;br/&gt;
 #7 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdeb918&amp;#93;&lt;/span&gt; fsfilt_ldiskfs_quotactl at ffffffffa03fc6fe&lt;br/&gt;
 #8 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdeb9c8&amp;#93;&lt;/span&gt; filter_quota_ctl at ffffffffa07d1bc2&lt;br/&gt;
 #9 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdebaf8&amp;#93;&lt;/span&gt; ost_handle at ffffffffa06627d9&lt;br/&gt;
#10 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdebca8&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request at ffffffffa06c5b11&lt;br/&gt;
#11 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdebde8&amp;#93;&lt;/span&gt; ptlrpc_main at ffffffffa06c6f0a&lt;br/&gt;
#12 &lt;span class=&quot;error&quot;&gt;&amp;#91;ffff88039cdebf48&amp;#93;&lt;/span&gt; kernel_thread at ffffffff8100d1aa&lt;br/&gt;
============================================================================&lt;/p&gt;


&lt;p&gt;We can also see that a (struct super_block *)-&amp;gt;s_dquot.info&lt;span class=&quot;error&quot;&gt;&amp;#91;cnt&amp;#93;&lt;/span&gt;.dqi_dirty_list list contains a single &quot;struct dquot&quot; having its dq_dirty.new pointing to itself and also its dq_flags with both DQ_ACTIVE_B and DQ_MOD_B bits unset. It seems that this is leading to an infinite loop in vfs_quota_sync()/clear_dquot_dirty().&lt;/p&gt;

&lt;p&gt;So maybe there is a place (in the kernel or Lustre) where a dquot struct can be chained or unchained on the dqi_dirty_list without the protection of &quot;dq_list_lock&quot;.&lt;/p&gt;


&lt;p&gt;On the OSSes, we also see very often the following messages in the syslog:&lt;/p&gt;

&lt;p&gt;2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: -----------&lt;del&gt;[ cut here ]&lt;/del&gt;-----------&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: WARNING: at lib/list_debug.c:26 __list_add+0x6d/0xa0() (Tainted: GF       W )&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: Hardware name: bullx super-node&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: list_add corruption. next-&amp;gt;prev should be prev (ffff88087da265c0), but was ffff88087c9bb2b0. (n&lt;br/&gt;
ext=ffff88087c9bb2b0).&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: Modules linked in: iptable_filter(U) ip_tables(U) x_tables(U) obdfilter(U) fsfilt_ldiskfs(U) os&lt;br/&gt;
t(U) mgc(U) ldiskfs(U) jbd2(U) lustre(U) lov(U) osc(U) mdc(U) lquota(U) fid(U) fld(U) ko2iblnd(U) ptlrpc(U) obdclass(U) lnet(U) lvfs(U) libcfs(F)(U)&lt;br/&gt;
 lpfc(U) scsi_transport_fc(U) scsi_tgt(U) nfs(U) lockd(U) fscache(U) nfs_acl(U) auth_rpcgss(U) sunrpc(U) cpufreq_ondemand(U) acpi_cpufreq(U) freq_ta&lt;br/&gt;
ble(U) rdma_ucm(U) ib_sdp(U) rdma_cm(U) iw_cm(U) ib_addr(U) ib_ipoib(U) ib_cm(U) ib_sa(U) ipv6(U) ib_uverbs(U) ib_umad(U) mlx4_ib(U) ib_mthca(U) ib_&lt;br/&gt;
mad(U) ib_core(U) usbhid(U) hid(U) mlx4_core(U) igb(U) ioatdma(U) i2c_i801(U) sg(U) i2c_core(U) uhci_hcd(U) dca(U) ehci_hcd(U) iTCO_wdt(U) iTCO_vend&lt;br/&gt;
or_support(U) ext3(U) jbd(U) mbcache(U) sd_mod(U) crc_t10dif(U) ahci(U) dm_mod(U) &lt;span class=&quot;error&quot;&gt;&amp;#91;last unloaded: scsi_tgt&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: Pid: 10660, comm: ll_ost_io_185 Tainted: GF       W  2.6.32-30.el6.Bull.16.x86_64 #1&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: Call Trace:&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105caa3&amp;gt;&amp;#93;&lt;/span&gt; warn_slowpath_common+0x83/0xc0&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105cb41&amp;gt;&amp;#93;&lt;/span&gt; warn_slowpath_fmt+0x41/0x50&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8124ca5d&amp;gt;&amp;#93;&lt;/span&gt; __list_add+0x6d/0xa0&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811aef9d&amp;gt;&amp;#93;&lt;/span&gt; dquot_mark_dquot_dirty+0x5d/0x70&lt;br/&gt;
2011-03-31 11:38:17 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa087f251&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_mark_dquot_dirty+0x31/0x60 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811af887&amp;gt;&amp;#93;&lt;/span&gt; __dquot_free_space+0x197/0x2f0&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811afa10&amp;gt;&amp;#93;&lt;/span&gt; dquot_free_space+0x10/0x20&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa084b3a3&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_free_blocks+0xf3/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa085033e&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_ext_truncate+0x82e/0x9c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811106e2&amp;gt;&amp;#93;&lt;/span&gt; ? pagevec_lookup+0x22/0x30&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa085cfc8&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_truncate+0x4c8/0x660 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa084d43b&amp;gt;&amp;#93;&lt;/span&gt; ? __ldiskfs_handle_dirty_metadata+0x7b/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8112303b&amp;gt;&amp;#93;&lt;/span&gt; ? unmap_mapping_range+0x6b/0x140&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81111ebe&amp;gt;&amp;#93;&lt;/span&gt; vmtruncate+0x5e/0x70&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811729c5&amp;gt;&amp;#93;&lt;/span&gt; inode_setattr+0x35/0x170&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa085dba6&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_setattr+0x186/0x390 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c500e&amp;gt;&amp;#93;&lt;/span&gt; fsfilt_ldiskfs_setattr+0x17e/0x200 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810fee3f&amp;gt;&amp;#93;&lt;/span&gt; ? find_or_create_page+0x3f/0xb0&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08f0fd4&amp;gt;&amp;#93;&lt;/span&gt; filter_setattr_internal+0xcc4/0x22c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08de14f&amp;gt;&amp;#93;&lt;/span&gt; ? filter_fmd_find_nolock+0x24f/0x2f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08d6633&amp;gt;&amp;#93;&lt;/span&gt; ? filter_fmd_put+0x33/0x190 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00f4dc1&amp;gt;&amp;#93;&lt;/span&gt; ? push_ctxt+0x281/0x3e0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lvfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08f272d&amp;gt;&amp;#93;&lt;/span&gt; filter_setattr+0x15d/0x610 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0600e0b&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_v2+0x23b/0x310 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ffc65&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_buf+0x85/0x90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa062ba7b&amp;gt;&amp;#93;&lt;/span&gt; ? __req_capsule_get+0x14b/0x6b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0600fb1&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_pack_reply_flags+0xd1/0x1f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08f2cb9&amp;gt;&amp;#93;&lt;/span&gt; filter_truncate+0xd9/0x290 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00f973c&amp;gt;&amp;#93;&lt;/span&gt; ? lprocfs_counter_add+0x12c/0x170 &lt;span class=&quot;error&quot;&gt;&amp;#91;lvfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08b0741&amp;gt;&amp;#93;&lt;/span&gt; ost_punch+0x2a1/0x8c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06019dc&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_version+0x7c/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ff884&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_opc+0x94/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0601b9c&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_conn_cnt+0x7c/0xe0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08b86b0&amp;gt;&amp;#93;&lt;/span&gt; ost_handle+0x31d0/0x4f40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8124a390&amp;gt;&amp;#93;&lt;/span&gt; ? __bitmap_weight+0x50/0xb0&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ff884&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_opc+0x94/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060eb11&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request+0x421/0xef0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104079e&amp;gt;&amp;#93;&lt;/span&gt; ? activate_task+0x2e/0x40&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e0b6&amp;gt;&amp;#93;&lt;/span&gt; ? try_to_wake_up+0x286/0x380&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e1c2&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x12/0x20&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81041059&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up_common+0x59/0x90&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa012c5ae&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_timer_arm+0xe/0x10 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060ff0a&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0x92a/0x15b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e1b0&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100d1aa&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060f5e0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x15b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100d1a0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
2011-03-31 11:38:18 Mar 31 11:38:17 node206 kernel: --&lt;del&gt;[ end trace bb3c2f07eefda023 ]&lt;/del&gt;--&lt;/p&gt;

&lt;p&gt;..........&lt;/p&gt;

&lt;p&gt;2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: -----------&lt;del&gt;[ cut here ]&lt;/del&gt;-----------&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: WARNING: at lib/list_debug.c:26 __list_add+0x6d/0xa0() (Tainted: GF       W )&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: Hardware name: bullx super-node&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: list_add corruption. next-&amp;gt;prev should be prev (ffff88087da265c0), but was ffff88087c9bb2b0. (n&lt;br/&gt;
ext=ffff88087c9bb2b0).&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: Modules linked in: iptable_filter(U) ip_tables(U) x_tables(U) obdfilter(U) fsfilt_ldiskfs(U) os&lt;br/&gt;
t(U) mgc(U) ldiskfs(U) jbd2(U) lustre(U) lov(U) osc(U) mdc(U) lquota(U) fid(U) fld(U) ko2iblnd(U) ptlrpc(U) obdclass(U) lnet(U) lvfs(U) libcfs(F)(U)&lt;br/&gt;
 lpfc(U) scsi_transport_fc(U) scsi_tgt(U) nfs(U) lockd(U) fscache(U) nfs_acl(U) auth_rpcgss(U) sunrpc(U) cpufreq_ondemand(U) acpi_cpufreq(U) freq_ta&lt;br/&gt;
ble(U) rdma_ucm(U) ib_sdp(U) rdma_cm(U) iw_cm(U) ib_addr(U) ib_ipoib(U) ib_cm(U) ib_sa(U) ipv6(U) ib_uverbs(U) ib_umad(U) mlx4_ib(U) ib_mthca(U) ib_&lt;br/&gt;
mad(U) ib_core(U) usbhid(U) hid(U) mlx4_core(U) igb(U) ioatdma(U) i2c_i801(U) sg(U) i2c_core(U) uhci_hcd(U) dca(U) ehci_hcd(U) iTCO_wdt(U) iTCO_vend&lt;br/&gt;
or_support(U) ext3(U) jbd(U) mbcache(U) sd_mod(U) crc_t10dif(U) ahci(U) dm_mod(U) &lt;span class=&quot;error&quot;&gt;&amp;#91;last unloaded: scsi_tgt&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: Pid: 20096, comm: ll_ost_io_45 Tainted: GF       W  2.6.32-30.el6.Bull.16.x86_64 #1&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: Call Trace:&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105caa3&amp;gt;&amp;#93;&lt;/span&gt; warn_slowpath_common+0x83/0xc0&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8105cb41&amp;gt;&amp;#93;&lt;/span&gt; warn_slowpath_fmt+0x41/0x50&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8124ca5d&amp;gt;&amp;#93;&lt;/span&gt; __list_add+0x6d/0xa0&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811aef9d&amp;gt;&amp;#93;&lt;/span&gt; dquot_mark_dquot_dirty+0x5d/0x70&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa087f251&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_mark_dquot_dirty+0x31/0x60 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811afb83&amp;gt;&amp;#93;&lt;/span&gt; __dquot_alloc_space+0x133/0x220&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81250078&amp;gt;&amp;#93;&lt;/span&gt; ? __percpu_counter_add+0x68/0x90&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811afc9e&amp;gt;&amp;#93;&lt;/span&gt; dquot_alloc_space+0xe/0x10&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0865e96&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_mb_new_blocks+0xf6/0x660 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81453c1e&amp;gt;&amp;#93;&lt;/span&gt; ? mutex_lock+0x1e/0x50&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811b0a7b&amp;gt;&amp;#93;&lt;/span&gt; ? dqget+0x1cb/0x380&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c6d1b&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_ext_new_extent_cb+0x59b/0x6f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff811851cc&amp;gt;&amp;#93;&lt;/span&gt; ? __getblk+0x2c/0x2e0&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa084f7e9&amp;gt;&amp;#93;&lt;/span&gt; ldiskfs_ext_walk_space+0x109/0x2c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c6780&amp;gt;&amp;#93;&lt;/span&gt; ? ldiskfs_ext_new_extent_cb+0x0/0x6f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c644d&amp;gt;&amp;#93;&lt;/span&gt; fsfilt_map_nblocks+0xed/0x120 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c659b&amp;gt;&amp;#93;&lt;/span&gt; fsfilt_ldiskfs_map_ext_inode_pages+0x11b/0x260 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff810cea15&amp;gt;&amp;#93;&lt;/span&gt; ? call_rcu_sched+0x15/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81088cad&amp;gt;&amp;#93;&lt;/span&gt; ? commit_creds+0x11d/0x1e0&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08c6775&amp;gt;&amp;#93;&lt;/span&gt; fsfilt_ldiskfs_map_inode_pages+0x95/0xa0 &lt;span class=&quot;error&quot;&gt;&amp;#91;fsfilt_ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa087efb8&amp;gt;&amp;#93;&lt;/span&gt; ? ldiskfs_journal_start_sb+0x58/0x90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ldiskfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08ff4c5&amp;gt;&amp;#93;&lt;/span&gt; filter_do_bio+0xd75/0x1860 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0901bd8&amp;gt;&amp;#93;&lt;/span&gt; filter_commitrw_write+0x13d8/0x284c &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08f4535&amp;gt;&amp;#93;&lt;/span&gt; filter_commitrw+0x2c5/0x2f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ffc65&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_buf+0x85/0x90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa062ba7b&amp;gt;&amp;#93;&lt;/span&gt; ? __req_capsule_get+0x14b/0x6b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00f973c&amp;gt;&amp;#93;&lt;/span&gt; ? lprocfs_counter_add+0x12c/0x170 &lt;span class=&quot;error&quot;&gt;&amp;#91;lvfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08abffa&amp;gt;&amp;#93;&lt;/span&gt; obd_commitrw+0x11a/0x410 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08b4644&amp;gt;&amp;#93;&lt;/span&gt; ost_brw_write+0xff4/0x1e90 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05f9e44&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_send_reply+0x284/0x6f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08f2cb9&amp;gt;&amp;#93;&lt;/span&gt; ? filter_truncate+0xd9/0x290 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdfilter&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa00f973c&amp;gt;&amp;#93;&lt;/span&gt; ? lprocfs_counter_add+0x12c/0x170 &lt;span class=&quot;error&quot;&gt;&amp;#91;lvfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e1b0&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ff884&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_opc+0x94/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa08b937a&amp;gt;&amp;#93;&lt;/span&gt; ost_handle+0x3e9a/0x4f40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ost&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8124a390&amp;gt;&amp;#93;&lt;/span&gt; ? __bitmap_weight+0x50/0xb0&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa05ff884&amp;gt;&amp;#93;&lt;/span&gt; ? lustre_msg_get_opc+0x94/0x100 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060eb11&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_server_handle_request+0x421/0xef0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104079e&amp;gt;&amp;#93;&lt;/span&gt; ? activate_task+0x2e/0x40&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e0b6&amp;gt;&amp;#93;&lt;/span&gt; ? try_to_wake_up+0x286/0x380&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e1c2&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x12/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81041059&amp;gt;&amp;#93;&lt;/span&gt; ? __wake_up_common+0x59/0x90&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa012c5ae&amp;gt;&amp;#93;&lt;/span&gt; ? cfs_timer_arm+0xe/0x10 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060ff0a&amp;gt;&amp;#93;&lt;/span&gt; ptlrpc_main+0x92a/0x15b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8104e1b0&amp;gt;&amp;#93;&lt;/span&gt; ? default_wake_function+0x0/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100d1aa&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa060f5e0&amp;gt;&amp;#93;&lt;/span&gt; ? ptlrpc_main+0x0/0x15b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100d1a0&amp;gt;&amp;#93;&lt;/span&gt; ? child_rip+0x0/0x20&lt;br/&gt;
2011-04-02 10:59:08 Apr  2 10:59:08 node206 kernel: ---[ end trace bb3c2f07eefda100 ]---&lt;/p&gt;

&lt;p&gt;.........&lt;/p&gt;

&lt;p&gt;=============================================================&lt;/p&gt;



&lt;p&gt;To me, this problem looks very similar to bugzilla 22363. But it is strange that the fix for this bug was only landed in the 1.8 branch. In comment 28 Andrew says that master does not need it as it is a SLES11-only fix, but now that we support RHEL6 in master, is this still true?&lt;br/&gt;
And also, I noticed that the patch quota-support-64-bit-quota-format.patch is not applied in 2.6-rhel6.series file.&lt;/p&gt;

&lt;p&gt;What do you think?&lt;/p&gt;

&lt;p&gt;TIA,&lt;br/&gt;
Sebastien.&lt;/p&gt;</description>
                <environment></environment>
        <key id="10558">LU-195</key>
            <summary>OSS nodes hung due to multiple threads spinning on dq_list_lock with Lustre quotas enabled</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="5">Cannot Reproduce</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="sebastien.buisson">Sebastien Buisson</reporter>
                        <labels>
                    </labels>
                <created>Thu, 7 Apr 2011 00:48:28 +0000</created>
                <updated>Thu, 21 Apr 2011 07:26:24 +0000</updated>
                            <resolved>Thu, 21 Apr 2011 07:26:24 +0000</resolved>
                                    <version>Lustre 2.0.0</version>
                                    <fixVersion>Lustre 2.1.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="12536" author="johann" created="Thu, 7 Apr 2011 09:08:06 +0000"  >&lt;p&gt;This reminds me of bugzilla ticket 22363. Is this fix included in your RHEL6 kernel patch series?&lt;/p&gt;</comment>
                            <comment id="12555" author="pjones" created="Thu, 7 Apr 2011 10:23:12 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Can you please check whether we have the fix mentioned in our own RHEL6 patch series?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter &lt;/p&gt;</comment>
                            <comment id="12666" author="bobijam" created="Thu, 7 Apr 2011 21:43:42 +0000"  >&lt;p&gt;2.6.32-71.18.1.el6 kernel already contain 64 bit quota support and its do_set_dqblk() uses atomic set_bit() instead of __set_bit().&lt;/p&gt;</comment>
                            <comment id="12668" author="bobijam" created="Thu, 7 Apr 2011 22:18:23 +0000"  >&lt;p&gt;I checked 2.6.32-71.18.1.el6, dquot_mark_dquot_dirty() and clear_dquot_dirty() are all under dq_list_lock&apos;s protection, and DQ_MOD_B flag only set in dquot_mark_dquot_dirty() and only unset in clear_dquot_dirty(). It is strange that a dquot item with DQ_MOD_B flag unset while still on the super_block&apos;s dqi_dirty_list.&lt;/p&gt;</comment>
                            <comment id="12908" author="johann" created="Mon, 18 Apr 2011 08:45:09 +0000"  >&lt;p&gt;Bull, could you please confirm that your kernel also has the patch from bugzilla ticket 22363 applied?&lt;br/&gt;
If so, could you please give us the dump of the dquot structure which is still in the dirty list?&lt;/p&gt;</comment>
                            <comment id="13024" author="patrick.valentin" created="Tue, 19 Apr 2011 10:26:30 +0000"  >&lt;p&gt;The kernel sequence of code that was patched by BZ22363 for Lustre 1.8 in SLES11 is identical in RHEL6 kernel source (fs/quota/dquot.c), but we do not have the corresponding patch in our Lustre 2.0 source code.&lt;/p&gt;</comment>
                            <comment id="13175" author="patrick.valentin" created="Thu, 21 Apr 2011 04:33:19 +0000"  >&lt;p&gt;At CEA customer site, there are different kernel versions, depending on the server type:&lt;br/&gt;
	kernel-2.6.32-30.el6	&lt;br/&gt;
	kernel-2.6.32-71.14.1.el6&lt;br/&gt;
I checked the source code, and the fix (use of atomic set_bit() instead of __set_bit()) is only present in the latter.&lt;br/&gt;
The hang reported by the customer is on a server installed with the former (without the fix).&lt;br/&gt;
We are going to ask them, at the next meeting, if the problem only occurs on servers installed with the old kernel.&lt;/p&gt;</comment>
                            <comment id="13188" author="pjones" created="Thu, 21 Apr 2011 07:26:24 +0000"  >&lt;p&gt;As per update from Bull, this issue only occurs in pre-GA versions of RHEL6 without the previously mentioned adjustment so marking as RESOLVED. Please reopen if some further evidence is found to suggest that this is not the case.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvslr:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>8538</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>