<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:58:54 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-6286] During path failover KMMPD hangs updating mmp</title>
                <link>https://jira.whamcloud.com/browse/LU-6286</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;During SRP path failover, kmmpd hangs, which causes the OSS to require a reboot.&lt;/p&gt;

&lt;p&gt;Full details are in the log file.&lt;/p&gt;

&lt;p&gt;path failed at 14:46:50&lt;/p&gt;
&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;Feb 24 14:46:50 nbp9-oss5 OpenSM[4146]: SM port is down
Feb 24 14:46:50 nbp9-oss5 OpenSM[4146]: Entering DISCOVERING state
Feb 24 14:47:02 nbp9-oss5 run_srp_daemon[95911]: failed srp_daemon: [HCA=mlx4_1] [port=1] [exit status=110]. Will &lt;span class=&quot;code-keyword&quot;&gt;try&lt;/span&gt; to restart srp_daemon periodically. No more warnings will be issued in the next 7200 seconds &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; the same problem repeats
Feb 24 14:47:10 nbp9-oss5 run_srp_daemon[95917]: starting srp_daemon: [HCA=mlx4_1] [port=1]
Feb 24 14:47:18 nbp9-oss5 kernel: scsi host12: ib_srp: failed receive status 5
Feb 24 14:47:18 nbp9-oss5 kernel: scsi host12: ib_srp: failed receive status 5
.....
Feb 24 14:49:07 nbp9-oss5 kernel: INFO: task kmmpd-dm-20:20927 blocked &lt;span class=&quot;code-keyword&quot;&gt;for&lt;/span&gt; more than 120 seconds.
Feb 24 14:49:07 nbp9-oss5 kernel: &lt;span class=&quot;code-quote&quot;&gt;&quot;echo 0 &amp;gt; /proc/sys/kernel/hung_task_timeout_secs&quot;&lt;/span&gt; disables &lt;span class=&quot;code-keyword&quot;&gt;this&lt;/span&gt; message.
Feb 24 14:49:10 nbp9-oss5 kernel: kmmpd-dm-20   D 0000000000000000     0 20927      2 0x00000080
Feb 24 14:49:10 nbp9-oss5 kernel: ffff880aad5f7d20 0000000000000046 0000000000000000 ffffffffa001740c
Feb 24 14:49:10 nbp9-oss5 kernel: ffff880301b415c0 0000000000000008 0000000000007030 000000000fd00014
Feb 24 14:49:10 nbp9-oss5 kernel: ffff880aad45faf8 ffff880aad5f7fd8 000000000000fc40 ffff880aad45faf8
Feb 24 14:49:10 nbp9-oss5 kernel: Call Trace:
Feb 24 14:49:10 nbp9-oss5 kernel: [&amp;lt;ffffffffa001740c&amp;gt;] ? dm_table_unplug_all+0x5c/0x100 [dm_mod]
Feb 24 14:49:10 nbp9-oss5 kernel: [&amp;lt;ffffffff811b2c60&amp;gt;] ? sync_buffer+0x0/0x50
Feb 24 14:49:10 nbp9-oss5 kernel: [&amp;lt;ffffffff8153fe63&amp;gt;] io_schedule+0x73/0xc0
Feb 24 14:49:10 nbp9-oss5 kernel: [&amp;lt;ffffffff811b2ca0&amp;gt;] sync_buffer+0x40/0x50
Feb 24 14:49:10 nbp9-oss5 kernel: [&amp;lt;ffffffff8154081f&amp;gt;] __wait_on_bit+0x5f/0x90
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff811b2c60&amp;gt;] ? sync_buffer+0x0/0x50
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff815408c8&amp;gt;] out_of_line_wait_on_bit+0x78/0x90
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff81096350&amp;gt;] ? wake_bit_function+0x0/0x50
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff811b2c56&amp;gt;] __wait_on_buffer+0x26/0x30
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffffa0c9d40a&amp;gt;] write_mmp_block+0x5a/0x80 [ldiskfs]
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffffa0c9d955&amp;gt;] kmmpd+0x1a5/0x3b0 [ldiskfs]
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffffa0c9d7b0&amp;gt;] ? kmmpd+0x0/0x3b0 [ldiskfs]
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff81095fa6&amp;gt;] kthread+0x96/0xa0
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff8100c0ca&amp;gt;] child_rip+0xa/0x20
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff81095f10&amp;gt;] ? kthread+0x0/0xa0
Feb 24 14:49:11 nbp9-oss5 kernel: [&amp;lt;ffffffff8100c0c0&amp;gt;] ? child_rip+0x0/0x20
....
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>kernel 2.6.32-358.23.2.el6</environment>
        <key id="28850">LU-6286</key>
            <summary>During path failover KMMPD hangs updating mmp</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="6">Not a Bug</resolution>
                                        <assignee username="bfaccini">Bruno Faccini</assignee>
                                    <reporter username="mhanafi">Mahmoud Hanafi</reporter>
                        <labels>
                    </labels>
                <created>Wed, 25 Feb 2015 23:13:57 +0000</created>
                <updated>Thu, 15 Oct 2015 23:06:22 +0000</updated>
                            <resolved>Thu, 15 Oct 2015 23:06:22 +0000</resolved>
                                    <version>Lustre 2.4.3</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>4</watches>
                                                                            <comments>
                            <comment id="108091" author="bfaccini" created="Thu, 26 Feb 2015 12:58:10 +0000"  >&lt;p&gt;The node&apos;s full syslog that you provided indicates that the IB/SRP path/devices never recovered, and thus the further hung stacks of the kmmpd/ost threads that are displayed should only be normal consequences.&lt;br/&gt;
This looks like some IB/SRP driver/device SW/HW/FW problem on the I/O path upstream of the Lustre layers.&lt;/p&gt;
</comment>
                            <comment id="130562" author="pjones" created="Thu, 15 Oct 2015 23:06:22 +0000"  >&lt;p&gt;As per NASA, OK to close.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="17114" name="service165.gz" size="24079" author="mhanafi" created="Wed, 25 Feb 2015 23:13:57 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzx733:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>17618</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>