<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:14:39 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1219] The connection is refused due to still busy with 1 active RPCs</title>
                <link>https://jira.whamcloud.com/browse/LU-1219</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>
&lt;p&gt;We got the following call traces at the customer site, and one OST refuses to connect due to still busy with 1 active RPCs.&lt;/p&gt;

&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;Mar 15 00:14:14 t2s007059 kernel: Pid: 13147, comm: ll_ost_io_229
Mar 15 00:14:14 t2s007059 kernel: 
Mar 15 00:14:14 t2s007059 kernel: Call Trace:
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff8002e024&amp;gt;] __wake_up+0x38/0x4f
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff889fc7f3&amp;gt;] jbd2_log_wait_commit+0xa3/0xf5 [jbd2]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff800a2dff&amp;gt;] autoremove_wake_function+0x0/0x2e
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88b1390b&amp;gt;] fsfilt_ldiskfs_commit_wait+0xab/0xd0 [fsfilt_ldiskfs]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88b54144&amp;gt;] filter_commitrw_write+0x1e14/0x2dd0 [obdfilter]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff886da3a6&amp;gt;] lnet_ni_send+0x96/0xe0 [lnet]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88aeeede&amp;gt;] ost_checksum_bulk+0x36e/0x5a0 [ost]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88af5d09&amp;gt;] ost_brw_write+0x1c99/0x2480 [ost]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887ebac8&amp;gt;] ptlrpc_send_reply+0x5e8/0x600 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887b68b0&amp;gt;] target_committed_to_req+0x40/0x120 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff8008e7f9&amp;gt;] default_wake_function+0x0/0xe
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887f00a8&amp;gt;] lustre_msg_check_version_v2+0x8/0x20 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88af909e&amp;gt;] ost_handle+0x2bae/0x55b0 [ost]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88741d00&amp;gt;] class_handle2object+0xe0/0x170 [obdclass]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887aa19a&amp;gt;] lock_res_and_lock+0xba/0xd0 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887af168&amp;gt;] __ldlm_handle2lock+0x2f8/0x360 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887ff6d9&amp;gt;] ptlrpc_server_handle_request+0x989/0xe00 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887ffe35&amp;gt;] ptlrpc_wait_event+0x2e5/0x310 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff8008cc1e&amp;gt;] __wake_up_common+0x3e/0x68
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff88800dc6&amp;gt;] ptlrpc_main+0xf66/0x1120 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff8005dfb1&amp;gt;] child_rip+0xa/0x11
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff887ffe60&amp;gt;] ptlrpc_main+0x0/0x1120 [ptlrpc]
Mar 15 00:14:14 t2s007059 kernel:  [&amp;lt;ffffffff8005dfa7&amp;gt;] child_rip+0x0/0x11
Mar 15 00:14:14 t2s007059 kernel: 
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;</description>
                <environment>server : lustre-1.8.7, client : lustre-1.8.4.ddn2.2</environment>
        <key id="13576">LU-1219</key>
            <summary>The connection is refused due to still busy with 1 active RPCs</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="4">Incomplete</resolution>
                                        <assignee username="hongchao.zhang">Hongchao Zhang</assignee>
                                    <reporter username="ihara">Shuichi Ihara</reporter>
                        <labels>
                    </labels>
                <created>Thu, 15 Mar 2012 01:15:52 +0000</created>
                <updated>Thu, 20 Dec 2012 14:29:34 +0000</updated>
                            <resolved>Thu, 20 Dec 2012 14:29:34 +0000</resolved>
                                    <version>Lustre 1.8.7</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>3</watches>
                                                                            <comments>
                            <comment id="31261" author="pjones" created="Thu, 15 Mar 2012 02:07:18 +0000"  >&lt;p&gt;Hongchao &lt;/p&gt;

&lt;p&gt;Could you please help with this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="31262" author="adilger" created="Thu, 15 Mar 2012 02:14:10 +0000"  >&lt;p&gt;This is possibly a duplicate of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-793&quot; title=&quot;Reconnections should not be refused when there is a request in progress from this client.&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-793&quot;&gt;&lt;del&gt;LU-793&lt;/del&gt;&lt;/a&gt;, for which Oleg already has a patch.&lt;/p&gt;</comment>
                            <comment id="31264" author="green" created="Thu, 15 Mar 2012 02:29:22 +0000"  >&lt;p&gt;The underlying issue is the write stuck in jbd somehow, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-793&quot; title=&quot;Reconnections should not be refused when there is a request in progress from this client.&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-793&quot;&gt;&lt;del&gt;LU-793&lt;/del&gt;&lt;/a&gt; would not fix this, it just papers over some of the symptoms.&lt;/p&gt;</comment>
                            <comment id="31564" author="hongchao.zhang" created="Tue, 20 Mar 2012 02:00:13 +0000"  >&lt;p&gt;The journal is stuck while committing the previous transaction. Is the process information for this node available?&lt;br/&gt;
The stack trace of &quot;kjournald2&quot; should give some information about where it was stuck. Thanks!&lt;/p&gt;</comment>
                            <comment id="31623" author="ihara" created="Tue, 20 Mar 2012 21:24:18 +0000"  >&lt;p&gt;Hongchao,&lt;/p&gt;

&lt;p&gt;Unfortunately, we only have /var/log/messages and /tmp/lustre-log.&amp;lt;timestamp&amp;gt;&lt;/p&gt;

&lt;p&gt;If the problem happens again, we can collect all the information you want.&lt;br/&gt;
Please let us know which commands we should run before rebooting the servers.&lt;/p&gt;</comment>
                            <comment id="32911" author="ihara" created="Fri, 30 Mar 2012 08:59:57 +0000"  >&lt;p&gt;Hi, &lt;br/&gt;
The customer is waiting to hear what information they should collect the next time the same problem happens.&lt;br/&gt;
Please let me know exactly what we should do.&lt;/p&gt;</comment>
                            <comment id="33045" author="hongchao.zhang" created="Sat, 31 Mar 2012 01:10:28 +0000"  >&lt;p&gt;Hi Shuichi&lt;/p&gt;

&lt;p&gt;Sorry for the delayed response.&lt;br/&gt;
Please collect the thread info of all tasks via sysrq (echo &quot;t&quot; &amp;gt;/proc/sysrq-trigger) on the node where the OST resides,&lt;br/&gt;
and, if possible, also capture the address at which the &quot;kjournald2&quot; process is running at that moment. Thanks!&lt;/p&gt;</comment>
                            <comment id="49502" author="adilger" created="Thu, 20 Dec 2012 14:29:34 +0000"  >&lt;p&gt;Close this old issue until there is more information available.&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                            <attachment id="10954" name="messages.t2s007059" size="463925" author="ihara" created="Thu, 15 Mar 2012 01:15:52 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvh6v:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6434</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>