<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:02:56 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-17] LBUG in ksocklnd</title>
                <link>https://jira.whamcloud.com/browse/LU-17</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;While testing iozone, a client hit this LBUG:&lt;/p&gt;

&lt;p&gt;Nov 18 15:43:53 psana0107 kernel: LustreError: 28278:0:(socklnd_cb.c:550:ksocknal_process_transmit()) ASSERTION(rc &amp;lt; 0) failed&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: LustreError: 28278:0:(socklnd_cb.c:550:ksocknal_process_transmit()) LBUG&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: Pid: 28278, comm: socknal_sd01&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: Call Trace:&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff884b56a1&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x51/0x60 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff884b5bda&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x7a/0xd0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff884bdf40&amp;gt;&amp;#93;&lt;/span&gt; tracefile_init+0x0/0x110 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff886a582a&amp;gt;&amp;#93;&lt;/span&gt; ksocknal_process_transmit+0x33a/0x640 &lt;span class=&quot;error&quot;&gt;&amp;#91;ksocklnd&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff886a75cb&amp;gt;&amp;#93;&lt;/span&gt; ksocknal_scheduler+0x38b/0x640 &lt;span class=&quot;error&quot;&gt;&amp;#91;ksocklnd&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff800a0abe&amp;gt;&amp;#93;&lt;/span&gt; autoremove_wake_function+0x0/0x2e&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfb1&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0xa/0x11&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff886a7240&amp;gt;&amp;#93;&lt;/span&gt; ksocknal_scheduler+0x0/0x640 &lt;span class=&quot;error&quot;&gt;&amp;#91;ksocklnd&amp;#93;&lt;/span&gt;&lt;br/&gt;
Nov 18 15:43:53 psana0107 kernel: &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8005dfa7&amp;gt;&amp;#93;&lt;/span&gt; child_rip+0x0/0x11&lt;/p&gt;

&lt;p&gt;Liang Zhen posted this patch in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15&quot; title=&quot;strange slow IO messages and bad performance &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15&quot;&gt;&lt;del&gt;LU-15&lt;/del&gt;&lt;/a&gt; originally:&lt;br/&gt;
&lt;a href=&quot;http://review.whamcloud.com/#change,127&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,127&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;This bug is to track work on that.&lt;/p&gt;</description>
                <environment></environment>
        <key id="10114">LU-17</key>
            <summary>LBUG in ksocklnd</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="4" iconUrl="https://jira.whamcloud.com/images/icons/priorities/minor.svg">Minor</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="liang">Liang Zhen</assignee>
                                    <reporter username="kitwestneat">Kit Westneat</reporter>
                        <labels>
                    </labels>
                <created>Mon, 22 Nov 2010 07:41:06 +0000</created>
                <updated>Thu, 3 Feb 2011 15:12:13 +0000</updated>
                            <resolved>Thu, 3 Feb 2011 15:12:13 +0000</resolved>
                                                                        <due></due>
                            <votes>0</votes>
                                    <watches>1</watches>
                                                                            <comments>
                            <comment id="10213" author="dferber" created="Mon, 22 Nov 2010 07:55:07 +0000"  >&lt;p&gt;Thanks Kit. I assigned to Liang as he is working on this. &lt;/p&gt;</comment>
                            <comment id="10214" author="rread" created="Mon, 22 Nov 2010 08:44:02 +0000"  >&lt;p&gt;Liang, please post the patch to a new bugzilla bug and request an inspection from Isaac.&lt;/p&gt;</comment>
                            <comment id="10222" author="dferber" created="Mon, 22 Nov 2010 16:34:33 +0000"  >&lt;p&gt;Cross referencing Liang&apos;s comment in bug &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-15&quot; title=&quot;strange slow IO messages and bad performance &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-15&quot;&gt;&lt;del&gt;LU-15&lt;/del&gt;&lt;/a&gt;, which Kit opened this &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-17&quot; title=&quot;LBUG in ksocklnd&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-17&quot;&gt;&lt;del&gt;LU-17&lt;/del&gt;&lt;/a&gt; bug up for:&lt;/p&gt;

&lt;p&gt;Liang Zhen added a comment - 18/Nov/10 8:06 PM&lt;br/&gt;
I&apos;ve posted patch on &lt;a href=&quot;http://review.whamcloud.com/#change,127&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/#change,127&lt;/a&gt;&lt;br/&gt;
(description of the patch should be &quot;fix contention on ksock_tx_t&quot;)&lt;/p&gt;

&lt;p&gt;Description of the problem:&lt;/p&gt;

&lt;p&gt;If the connection is closed before ksocknal_transmit() returns to ksocknal_process_transmit(), then nobody holds a refcount on conn::ksnc_sock and all pending ZC requests will be finalized by ksocknal_connsock_decref-&amp;gt;ksocknal_finalize_zcreq.&lt;br/&gt;
ksocknal_finalize_zcreq will mark each not-yet-acked ZC request as an error by setting tx::tx_resid = -1.&lt;br/&gt;
This is a race because ksocknal_process_transmit() checks tx::tx_resid right after calling ksocknal_transmit(), and it can see&lt;br/&gt;
both tx-&amp;gt;tx_resid != 0 and rc == 0, and then hit the later LASSERT(rc &amp;lt; 0).&lt;br/&gt;
I&apos;ve added Jay and Lai as reviewers; I will also file a bug on bugzilla and try to push it into mainstream.&lt;/p&gt;

&lt;p&gt;But this bug is not the reason for the bad performance, so we still need to investigate the performance issue.&lt;/p&gt;

&lt;p&gt;Regards&lt;br/&gt;
Liang&lt;/p&gt;</comment>
                            <comment id="10223" author="liang" created="Mon, 22 Nov 2010 19:26:02 +0000"  >&lt;p&gt;I&apos;ve filed a bug on BZ and will try to push it into mainstream:&lt;br/&gt;
&lt;a href=&quot;https://bugzilla.lustre.org/show_bug.cgi?id=24218&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://bugzilla.lustre.org/show_bug.cgi?id=24218&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Regards&lt;br/&gt;
Liang&lt;/p&gt;</comment>
                            <comment id="10317" author="liang" created="Thu, 16 Dec 2010 20:57:39 +0000"  >&lt;p&gt;Patch landed on 2.x, still pending on test for 1.8&lt;/p&gt;</comment>
                            <comment id="10522" author="liang" created="Thu, 3 Feb 2011 15:12:13 +0000"  >&lt;p&gt;Patch landed on both 1.8.* and 2.*, mark it as resolved&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                    <customfield id="customfield_10020" key="com.atlassian.jira.plugin.system.customfieldtypes:float">
                        <customfieldname>Bugzilla ID</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>24218.0</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzw033:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>10093</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>