<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:51:41 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-5460] Lustre client crash</title>
                <link>https://jira.whamcloud.com/browse/LU-5460</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Hi,&lt;/p&gt;

&lt;p&gt;One of our clients which exports Lustre over NFS crashed, dumped and rebooted overnight. I&apos;m including the vmcore-dmesg here in case there is anything useful for you. I don&apos;t think we&apos;ve seen this one before so it must be rare. Full vmcore available on request.&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&amp;lt;4&amp;gt;general protection fault: 0000 [#1] SMP 
&amp;lt;4&amp;gt;last sysfs file: /sys/devices/system/node/node1/numastat
&amp;lt;4&amp;gt;CPU 21 
&amp;lt;4&amp;gt;Modules linked in: tcp_diag inet_diag mptctl mptbase ipmi_devintf dell_rbu nfsd exportfs autofs4 lmv(U) mgc(U) lustre(U) lov(U) osc(U) mdc(U) fid(U) fld(U) ksocklnd(U) ptlrpc(U) obdclass(U) lnet(U) lvfs(U) sha512_generic sha256_generic crc32c_intel libcfs(U) nfs lockd fscache auth_rpcgss nfs_acl sunrpc bonding 8021q garp stp llc ipv6 uinput raid456 async_raid6_recov async_pq raid6_pq async_xor xor async_memcpy async_tx power_meter sg bnx2x libcrc32c mdio bnx2 dcdbas microcode serio_raw iTCO_wdt iTCO_vendor_support i7core_edac edac_core ext3 jbd mbcache sr_mod cdrom sd_mod crc_t10dif pata_acpi ata_generic ata_piix mpt2sas scsi_transport_sas raid_class dm_mirror dm_region_hash dm_log dm_mod [last unloaded: scsi_wait_scan]
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Pid: 17387, comm: ldlm_bl_40 Not tainted 2.6.32-358.18.1.el6_lustre.x86_64 #1 Dell Inc. PowerEdge R610/0F0XJ6
&amp;lt;4&amp;gt;RIP: 0010:[&amp;lt;ffffffffa058ba3e&amp;gt;]  [&amp;lt;ffffffffa058ba3e&amp;gt;] cl_lock_mutex_get+0x2e/0xd0 [obdclass]
&amp;lt;4&amp;gt;RSP: 0018:ffff88046ec63c30  EFLAGS: 00010203
&amp;lt;4&amp;gt;RAX: 5a5a5a5a5a5a5a5a RBX: ffff880572210d10 RCX: ffff880a789650b8
&amp;lt;4&amp;gt;RDX: ffff8808e88c5448 RSI: ffff880a58758a18 RDI: ffff880572210d10
&amp;lt;4&amp;gt;RBP: ffff88046ec63c50 R08: ffffffffa05ab7ee R09: 0000000000000000
&amp;lt;4&amp;gt;R10: 5a5a5a5a5a5a5a5a R11: 5a5a5a5a5a5a5a5a R12: ffff880a58758a18
&amp;lt;4&amp;gt;R13: ffff88079d568678 R14: ffff880952923b70 R15: ffff880a58758a18
&amp;lt;4&amp;gt;FS:  00007ff150e51700(0000) GS:ffff880028340000(0000) knlGS:0000000000000000
&amp;lt;4&amp;gt;CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
&amp;lt;4&amp;gt;CR2: 00007ffbd6c4a9d4 CR3: 0000000c235b4000 CR4: 00000000000007e0
&amp;lt;4&amp;gt;DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
&amp;lt;4&amp;gt;DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
&amp;lt;4&amp;gt;&lt;span class=&quot;code-object&quot;&gt;Process&lt;/span&gt; ldlm_bl_40 (pid: 17387, threadinfo ffff88046ec62000, task ffff880bb62b0aa0)
&amp;lt;4&amp;gt;Stack:
&amp;lt;4&amp;gt; ffff880b4f421740 ffff880572210d10 ffff880a58758a18 ffff88079d568678
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; ffff88046ec63c70 ffffffffa0a014b9 ffff880572210d10 ffff8808e88c5420
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; ffff88046ec63cc0 ffffffffa0a01c39 ffff880b4f421740 ffff8808e88c5448
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a014b9&amp;gt;] lovsub_parent_lock+0x49/0x120 [lov]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0a01c39&amp;gt;] lovsub_lock_state+0x79/0x1b0 [lov]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0589718&amp;gt;] cl_lock_state_signal+0x68/0x160 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0589865&amp;gt;] cl_lock_state_set+0x55/0x190 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa058a8b3&amp;gt;] cl_lock_delete0+0x53/0x1d0 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa058ab83&amp;gt;] cl_lock_delete+0x153/0x1a0 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0968ac6&amp;gt;] osc_ldlm_blocking_ast+0x146/0x350 [osc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06b91bc&amp;gt;] ldlm_cancel_callback+0x6c/0x1a0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06d341a&amp;gt;] ldlm_cli_cancel_local+0x8a/0x470 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06d670e&amp;gt;] ldlm_cli_cancel_list_local+0xee/0x290 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06dc1b0&amp;gt;] ldlm_bl_thread_main+0x100/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81063410&amp;gt;] ? default_wake_function+0x0/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06dc0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06dc0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06dc0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&amp;lt;4&amp;gt;Code: e5 41 55 41 54 53 48 83 ec 08 0f 1f 44 00 00 65 48 8b 04 25 c0 cb 00 00 48 39 86 90 00 00 00 48 89 fb 49 89 f4 74 56 48 8b 46 28 &amp;lt;4c&amp;gt; 8b 28 e8 ba 58 ff ff 41 0f b6 b5 96 00 00 00 85 f6 74 23 8b 
&amp;lt;1&amp;gt;RIP  [&amp;lt;ffffffffa058ba3e&amp;gt;] cl_lock_mutex_get+0x2e/0xd0 [obdclass]
&amp;lt;4&amp;gt; RSP &amp;lt;ffff88046ec63c30&amp;gt;
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment></environment>
        <key id="25907">LU-5460</key>
            <summary>Lustre client crash</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="6" iconUrl="https://jira.whamcloud.com/images/icons/statuses/closed.png" description="The issue is considered finished, the resolution is correct. Issues which are closed can be reopened.">Closed</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="jay">Jinshan Xiong</assignee>
                                    <reporter username="daire">Daire Byrne</reporter>
                        <labels>
                    </labels>
                <created>Thu, 7 Aug 2014 11:04:51 +0000</created>
                <updated>Thu, 8 Feb 2018 18:28:27 +0000</updated>
                            <resolved>Thu, 8 Feb 2018 18:28:27 +0000</resolved>
                                    <version>Lustre 2.4.1</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="91066" author="jay" created="Thu, 7 Aug 2014 16:53:42 +0000"  >&lt;p&gt;Try this patch: &lt;a href=&quot;http://review.whamcloud.com/#/c/9876/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#/c/9876/&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="92145" author="daire" created="Thu, 21 Aug 2014 15:37:22 +0000"  >&lt;p&gt;We have not yet had an opportunity to try this patch but it looks like we just hit this again. A more complete vmcore-dmesg this time&lt;/p&gt;

&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;&amp;lt;3&amp;gt;LustreError: 16371:0:(dir.c:433:ll_get_dir_page()) read cache page: [0x200009459:0x129a8:0x0] at 3437219588190122278: rc -5
&amp;lt;4&amp;gt;general protection fault: 0000 [#1] SMP 
&amp;lt;4&amp;gt;last sysfs file: /sys/devices/pci0000:00/0000:00:1e.0/0000:06:03.0/local_cpus
&amp;lt;4&amp;gt;CPU 19 
&amp;lt;4&amp;gt;Modules linked in: tcp_diag inet_diag mptctl mptbase ipmi_devintf dell_rbu nfsd exportfs autofs4 lmv(U) mgc(U) lustre(U) lov(U) osc(U) mdc(U) fid(U) fld(U) ksocklnd(U) ptlrpc(U) obdclass(U) lnet(U) lvfs(U) sha512_generic sha256_generic crc32c_intel libcfs(U) nfs lockd fscache auth_rpcgss nfs_acl sunrpc bonding 8021q garp stp llc ipv6 uinput power_meter sg bnx2x libcrc32c mdio bnx2 dcdbas microcode serio_raw iTCO_wdt iTCO_vendor_support i7core_edac edac_core ext3 jbd mbcache sr_mod cdrom sd_mod crc_t10dif pata_acpi ata_generic ata_piix mpt2sas scsi_transport_sas raid_class dm_mirror dm_region_hash dm_log dm_mod [last unloaded: scsi_wait_scan]
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Pid: 5694, comm: ldlm_bl_24 Not tainted 2.6.32-358.18.1.el6_lustre.x86_64 #1 Dell Inc. PowerEdge R610/01W9FG
&amp;lt;4&amp;gt;RIP: 0010:[&amp;lt;ffffffffa053ba3e&amp;gt;]  [&amp;lt;ffffffffa053ba3e&amp;gt;] cl_lock_mutex_get+0x2e/0xd0 [obdclass]
&amp;lt;4&amp;gt;RSP: 0018:ffff8809688ffdf0  EFLAGS: 00010203
&amp;lt;4&amp;gt;RAX: 5a5a5a5a5a5a5a5a RBX: ffff88060a790338 RCX: 0000000000000000
&amp;lt;4&amp;gt;RDX: 0000000000000981 RSI: ffff880be73c6858 RDI: ffff88060a790338
&amp;lt;4&amp;gt;RBP: ffff8809688ffe10 R08: 0000000000000001 R09: 00000000ffffffff
&amp;lt;4&amp;gt;R10: 0000000000000000 R11: 0000000000000000 R12: ffff880be73c6858
&amp;lt;4&amp;gt;R13: ffff88060a790338 R14: ffff88074323d6c0 R15: ffff8809688ffe40
&amp;lt;4&amp;gt;FS:  00007f2c87cec700(0000) GS:ffff880028320000(0000) knlGS:0000000000000000
&amp;lt;4&amp;gt;CS:  0010 DS: 0000 ES: 0000 CR0: 000000008005003b
&amp;lt;4&amp;gt;CR2: 00007f3b43a71000 CR3: 00000006048f9000 CR4: 00000000000007e0
&amp;lt;4&amp;gt;DR0: 0000000000000000 DR1: 0000000000000000 DR2: 0000000000000000
&amp;lt;4&amp;gt;DR3: 0000000000000000 DR6: 00000000ffff0ff0 DR7: 0000000000000400
&amp;lt;4&amp;gt;&lt;span class=&quot;code-object&quot;&gt;Process&lt;/span&gt; ldlm_bl_24 (pid: 5694, threadinfo ffff8809688fe000, task ffff8808b1bbeaa0)
&amp;lt;4&amp;gt;Stack:
&amp;lt;4&amp;gt; ffff8809688ffe10 ffff880aee93b6c0 ffff88074323d6c0 ffff88060a790338
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; ffff8809688ffe80 ffffffffa09189fa ffff8808b1bbf058 ffff8809688fffd8
&amp;lt;4&amp;gt;&amp;lt;d&amp;gt; ffff880be73c6858 00000001b1bbf058 ffff880600000001 0000000000000000
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09189fa&amp;gt;] osc_ldlm_blocking_ast+0x7a/0x350 [osc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa068bde0&amp;gt;] ldlm_handle_bl_callback+0x130/0x400 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa068c331&amp;gt;] ldlm_bl_thread_main+0x281/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff81063410&amp;gt;] ? default_wake_function+0x0/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa068c0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa068c0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa068c0b0&amp;gt;] ? ldlm_bl_thread_main+0x0/0x3d0 [ptlrpc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
&amp;lt;4&amp;gt;Code: e5 41 55 41 54 53 48 83 ec 08 0f 1f 44 00 00 65 48 8b 04 25 c0 cb 00 00 48 39 86 90 00 00 00 48 89 fb 49 89 f4 74 56 48 8b 46 28 &amp;lt;4c&amp;gt; 8b 28 e8 ba 58 ff ff 41 0f b6 b5 96 00 00 00 85 f6 74 23 8b 
&amp;lt;1&amp;gt;RIP  [&amp;lt;ffffffffa053ba3e&amp;gt;] cl_lock_mutex_get+0x2e/0xd0 [obdclass]
&amp;lt;4&amp;gt; RSP &amp;lt;ffff8809688ffdf0&amp;gt;
&amp;lt;0&amp;gt;LustreError: 21790:0:(lovsub_lock.c:103:lovsub_lock_state()) ASSERTION( cl_lock_is_mutexed(slice-&amp;gt;cls_lock) ) failed: 
&amp;lt;0&amp;gt;LustreError: 21790:0:(lovsub_lock.c:103:lovsub_lock_state()) LBUG
&amp;lt;4&amp;gt;Pid: 21790, comm: ldlm_bl_76
&amp;lt;4&amp;gt;
&amp;lt;4&amp;gt;Call Trace:
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa03b7895&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa03b7e97&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa09b1d61&amp;gt;] lovsub_lock_state+0x1a1/0x1b0 [lov]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa03ccd94&amp;gt;] ? cfs_hash_dual_bd_unlock+0x34/0x60 [libcfs]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0539718&amp;gt;] cl_lock_state_signal+0x68/0x160 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0539865&amp;gt;] cl_lock_state_set+0x55/0x190 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa053a8b3&amp;gt;] cl_lock_delete0+0x53/0x1d0 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa053ab83&amp;gt;] cl_lock_delete+0x153/0x1a0 [obdclass]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa0918ac6&amp;gt;] osc_ldlm_blocking_ast+0x146/0x350 [osc]
&amp;lt;4&amp;gt; [&amp;lt;ffffffffa06691bc&amp;gt;] ldlm_cancel_callback+0x6c/0x1a0 [ptlrpc]
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="100545" author="daire" created="Wed, 3 Dec 2014 11:56:17 +0000"  >&lt;p&gt;We have not hit this again since applying the suggested patch. You can resolve the ticket. Cheers.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10490" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>End date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Wed, 3 Dec 2014 11:04:51 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                            <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzwt5b:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>15209</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                        <customfield id="customfield_10493" key="com.atlassian.jira.plugin.system.customfieldtypes:datepicker">
                        <customfieldname>Start date</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>Thu, 7 Aug 2014 11:04:51 +0000</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                    </customfields>
    </item>
</channel>
</rss>