<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:21:19 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1976] SWL - mds hard crash </title>
                <link>https://jira.whamcloud.com/browse/LU-1976</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Console &lt;span class=&quot;error&quot;&gt;&amp;#91;hyperion-rst6&amp;#93;&lt;/span&gt; log at 2012-09-18 18:00:00 PDT.&lt;br/&gt;
2012-09-18 18:04:56 Lustre: lustre-MDT0000: haven&apos;t heard from client 3beba6a9-a86c-e3b3-e02d-311fe4e1c5ec (at 192.168.118.135@o2ib1) in 227 seconds. I think it&apos;s dead, and I am evicting it. exp ffff880288182400, cur 1348016696 expire 1348016546 last 1348016469&lt;br/&gt;
2012-09-18 18:17:21 BUG: unable to handle kernel paging request at 000000008a5e6591&lt;br/&gt;
2012-09-18 18:17:21 IP: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0855018&amp;gt;&amp;#93;&lt;/span&gt; unlock_res_and_lock+0x18/0x40 &lt;span class=&quot;error&quot;&gt;&amp;#91;ptlrpc&amp;#93;&lt;/span&gt;&lt;br/&gt;
2012-09-18 18:17:21 PGD 0&lt;br/&gt;
2012-09-18 18:17:21 BUG: unable to handle kernel NULL pointer dereference at 0000000000000068&lt;br/&gt;
2012-09-18 18:17:21 IP: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81043b49&amp;gt;&amp;#93;&lt;/span&gt; no_context+0x99/0x260&lt;/p&gt;

&lt;p&gt;MDS fails to dump a stack, but does dump vmcore. at the same time one client dumped vmcore. both dumps are on brent ~cliffw/hyperion/&lt;/p&gt;</description>
                <environment></environment>
        <key id="16035">LU-1976</key>
            <summary>SWL - mds hard crash </summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="1" iconUrl="https://jira.whamcloud.com/images/icons/priorities/blocker.svg">Blocker</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="yong.fan">nasf</assignee>
                                    <reporter username="cliffw">Cliff White</reporter>
                        <labels>
                    </labels>
                <created>Tue, 18 Sep 2012 21:29:51 +0000</created>
                <updated>Mon, 3 Dec 2012 15:04:43 +0000</updated>
                            <resolved>Sat, 22 Sep 2012 01:13:22 +0000</resolved>
                                    <version>Lustre 2.3.0</version>
                                    <fixVersion>Lustre 2.3.0</fixVersion>
                    <fixVersion>Lustre 2.4.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="45179" author="cliffw" created="Tue, 18 Sep 2012 21:40:32 +0000"  >&lt;p&gt;Kernel backtrace, MDS:&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;
 bt
PID: 4898   TASK: ffff88012df62080  CPU: 7   COMMAND: &lt;span class=&quot;code-quote&quot;&gt;&quot;mdt03_008&quot;&lt;/span&gt;
 #0 [ffff880121e932b0] machine_kexec at ffffffff8103281b
 #1 [ffff880121e93310] crash_kexec at ffffffff810ba792
 #2 [ffff880121e933e0] oops_end at ffffffff81501700
 #3 [ffff880121e93410] die at ffffffff8100f26b
 #4 [ffff880121e93440] do_trap at ffffffff81500ff4
 #5 [ffff880121e934a0] do_invalid_op at ffffffff8100ce35
 #6 [ffff880121e93540] invalid_op at ffffffff8100bedb
    [exception RIP: add_dirent_to_buf+1216]
    RIP: ffffffffa0db21d0  RSP: ffff880121e935f0  RFLAGS: 00010246
    RAX: ffff880181248000  RBX: ffff880268654078  RCX: 00000000000014b5
    RDX: ffff880268654098  RSI: 0000000000000046  RDI: ffff88016ff93c00
    RBP: ffff880121e936b0   R8: 0000000000000000   R9: 0000000000000000
    R10: 0000000000000001  R11: 0000000000000000  R12: ffff880130e16ad0
    R13: 0000000000000000  R14: 0000000000000004  R15: 0000000000000020
    ORIG_RAX: ffffffffffffffff  CS: 0010  SS: 0018
 #7 [ffff880121e936b8] ldiskfs_add_entry at ffffffffa0db5c5d [ldiskfs]
 #8 [ffff880121e93758] __osd_ea_add_rec at ffffffffa1001689 [osd_ldiskfs]
 #9 [ffff880121e937a8] osd_index_ea_insert at ffffffffa100dbeb [osd_ldiskfs]
#10 [ffff880121e93838] __mdd_index_insert_only at ffffffffa0eee977 [mdd]
#11 [ffff880121e93898] __mdd_index_insert at ffffffffa0eef9b1 [mdd]
#12 [ffff880121e938e8] mdd_create at ffffffffa0ef55e3 [mdd]
#13 [ffff880121e93a28] cml_create at ffffffffa06a4637 [cmm]
#14 [ffff880121e93a78] mdt_reint_open at ffffffffa0f8bb9f [mdt]
#15 [ffff880121e93b48] mdt_reint_rec at ffffffffa0f75151 [mdt]
#16 [ffff880121e93b68] mdt_reint_internal at ffffffffa0f6e9aa [mdt]
#17 [ffff880121e93bb8] mdt_intent_reint at ffffffffa0f6ef7d [mdt]
#18 [ffff880121e93c08] mdt_intent_policy at ffffffffa0f6b191 [mdt]
#19 [ffff880121e93c48] ldlm_lock_enqueue at ffffffffa0859881 [ptlrpc]
#20 [ffff880121e93ca8] ldlm_handle_enqueue0 at ffffffffa08819bf [ptlrpc]
#21 [ffff880121e93d18] mdt_enqueue at ffffffffa0f6b506 [mdt]
#22 [ffff880121e93d38] mdt_handle_common at ffffffffa0f62802 [mdt]
#23 [ffff880121e93d88] mdt_regular_handle at ffffffffa0f636f5 [mdt]
#24 [ffff880121e93d98] ptlrpc_server_handle_request at ffffffffa08b199d [ptlrpc]
#25 [ffff880121e93e98] ptlrpc_main at ffffffffa08b2f89 [ptlrpc]
#26 [ffff880121e93f48] kernel_thread at ffffffff8100c14a
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</comment>
                            <comment id="45219" author="pjones" created="Wed, 19 Sep 2012 09:27:10 +0000"  >&lt;p&gt;Bobijam&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="45223" author="pjones" created="Wed, 19 Sep 2012 10:05:17 +0000"  >&lt;p&gt;Fanyong&lt;/p&gt;

&lt;p&gt;Oleg suggested that this might be a good ticket for you to look into&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="45269" author="yong.fan" created="Thu, 20 Sep 2012 12:09:40 +0000"  >&lt;p&gt;One possible reason may cause such failure: when multiple threads try to recycle empty OI leaves concurrently, the race among those threads may cause some OI index node(s) crazy. Especially when there are some index node(s) split threads in parallel, the cases will become more complex. The crazy OI index node(s) may cause memory crash. That may be why there are some strange failures recently.&lt;/p&gt;

&lt;p&gt;I am making patch to fix such issue.&lt;/p&gt;

&lt;p&gt;OI related codes are really bombs &lt;img class=&quot;emoticon&quot; src=&quot;https://jira.whamcloud.com/images/icons/emoticons/sad.png&quot; height=&quot;16&quot; width=&quot;16&quot; align=&quot;absmiddle&quot; alt=&quot;&quot; border=&quot;0&quot;/&gt;&lt;/p&gt;</comment>
                            <comment id="45314" author="yong.fan" created="Thu, 20 Sep 2012 23:02:10 +0000"  >&lt;p&gt;This is the patch:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/#change,4061&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,4061&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="45383" author="pjones" created="Sat, 22 Sep 2012 01:13:22 +0000"  >&lt;p&gt;Landed for 2.3 and 2.4&lt;/p&gt;</comment>
                            <comment id="48691" author="bogl" created="Mon, 3 Dec 2012 15:04:43 +0000"  >&lt;p&gt;back port to b2_1&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,4735&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,4735&lt;/a&gt;&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzv5hz:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>4425</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>