<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:15:45 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-1336] OSS GPF at ptlrpc_send_reply+0x470</title>
                <link>https://jira.whamcloud.com/browse/LU-1336</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;Back trace looks like this:&lt;/p&gt;


&lt;p&gt;machine_kexec&lt;br/&gt;
crash_kexec&lt;br/&gt;
oops_end&lt;br/&gt;
die&lt;br/&gt;
do_general_protection&lt;br/&gt;
general_protection&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;exception RIP: ptlrpc_send_reply+1136&amp;#93;&lt;/span&gt;&lt;br/&gt;
ptlrpc_send_error&lt;br/&gt;
target_send_reply_msg&lt;br/&gt;
target_send_reply&lt;br/&gt;
ost_handle&lt;br/&gt;
ptlrpc_main&lt;br/&gt;
kernel_thread&lt;/p&gt;

&lt;p&gt;That RIP resolves to lustre/ptlrpc/niobuf.c:436 which in our tree is here:&lt;/p&gt;


&lt;div class=&quot;code panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;codeContent panelContent&quot;&gt;
&lt;pre class=&quot;code-java&quot;&gt;434         &lt;span class=&quot;code-comment&quot;&gt;/* There may be no rq_export during failover */&lt;/span&gt;
435 
436         &lt;span class=&quot;code-keyword&quot;&gt;if&lt;/span&gt; (unlikely(req-&amp;gt;rq_export &amp;amp;&amp;amp; req-&amp;gt;rq_export-&amp;gt;exp_obd &amp;amp;&amp;amp;
437                      req-&amp;gt;rq_export-&amp;gt;exp_obd-&amp;gt;obd_fail)) { 
438                 &lt;span class=&quot;code-comment&quot;&gt;/* Failed obd&apos;s only send ENODEV */&lt;/span&gt;
439                 req-&amp;gt;rq_type = PTL_RPC_MSG_ERR;
440                 req-&amp;gt;rq_status = -ENODEV;
441                 CDEBUG(D_HA, &lt;span class=&quot;code-quote&quot;&gt;&quot;sending ENODEV from failed obd %d\n&quot;&lt;/span&gt;,
442                        req-&amp;gt;rq_export-&amp;gt;exp_obd-&amp;gt;obd_minor);
443         }
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Server was handling many client reconnects, under similar conditions as reported in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1085&quot; title=&quot;ASSERTION(cfs_atomic_read(&amp;amp;exp-&amp;gt;exp_refcount) == 0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1085&quot;&gt;&lt;del&gt;LU-1085&lt;/del&gt;&lt;/a&gt;, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1092&quot; title=&quot;NULL pointer dereference in filter_export_stats_init()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1092&quot;&gt;&lt;del&gt;LU-1092&lt;/del&gt;&lt;/a&gt;, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1093&quot; title=&quot;unable to handle kernel paging request in target_handle_connect()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1093&quot;&gt;&lt;del&gt;LU-1093&lt;/del&gt;&lt;/a&gt;, and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1094&quot; title=&quot;general protection fault in _debug_req()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1094&quot;&gt;&lt;del&gt;LU-1094&lt;/del&gt;&lt;/a&gt;.&lt;/p&gt;</description>
                <environment>&lt;a href=&quot;https://github.com/chaos/lustre/commits/2.1.0-24chaos&quot;&gt;https://github.com/chaos/lustre/commits/2.1.0-24chaos&lt;/a&gt;</environment>
        <key id="14108">LU-1336</key>
            <summary>OSS GPF at ptlrpc_send_reply+0x470</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="2" iconUrl="https://jira.whamcloud.com/images/icons/priorities/critical.svg">Critical</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="3">Duplicate</resolution>
                                        <assignee username="bobijam">Zhenyu Xu</assignee>
                                    <reporter username="nedbass">Ned Bass</reporter>
                        <labels>
                    </labels>
                <created>Wed, 18 Apr 2012 20:46:33 +0000</created>
                <updated>Mon, 30 Apr 2012 11:55:34 +0000</updated>
                            <resolved>Mon, 30 Apr 2012 11:55:34 +0000</resolved>
                                    <version>Lustre 2.1.0</version>
                                                        <due></due>
                            <votes>0</votes>
                                    <watches>2</watches>
                                                                            <comments>
                            <comment id="35069" author="pjones" created="Wed, 18 Apr 2012 21:28:10 +0000"  >&lt;p&gt;Bobi&lt;/p&gt;

&lt;p&gt;Could you please comment on this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="35072" author="tappro" created="Thu, 19 Apr 2012 02:01:04 +0000"  >&lt;p&gt;isn&apos;t that &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1092&quot; title=&quot;NULL pointer dereference in filter_export_stats_init()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1092&quot;&gt;&lt;del&gt;LU-1092&lt;/del&gt;&lt;/a&gt; which was landed:&lt;/p&gt;

&lt;p&gt;&lt;a href=&quot;http://git.whamcloud.com/?p=fs/lustre-release.git;a=commit;h=893cf2014a38c5bd94890d3522fafe55f024a958&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://git.whamcloud.com/?p=fs/lustre-release.git;a=commit;h=893cf2014a38c5bd94890d3522fafe55f024a958&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Also other &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1085&quot; title=&quot;ASSERTION(cfs_atomic_read(&amp;amp;exp-&amp;gt;exp_refcount) == 0) failed&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1085&quot;&gt;&lt;del&gt;LU-1085&lt;/del&gt;&lt;/a&gt;, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1093&quot; title=&quot;unable to handle kernel paging request in target_handle_connect()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1093&quot;&gt;&lt;del&gt;LU-1093&lt;/del&gt;&lt;/a&gt; and &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1094&quot; title=&quot;general protection fault in _debug_req()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1094&quot;&gt;&lt;del&gt;LU-1094&lt;/del&gt;&lt;/a&gt; look like duplicates&lt;/p&gt;</comment>
                            <comment id="35091" author="nedbass" created="Thu, 19 Apr 2012 11:39:03 +0000"  >&lt;p&gt;Hi Mikhail,&lt;/p&gt;

&lt;p&gt;I&apos;ve been tracking those separately because of the different exception sites.  That would be nice if they were all symptoms of the same bug.  &lt;/p&gt;

&lt;p&gt;Can we consider landing the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-1092&quot; title=&quot;NULL pointer dereference in filter_export_stats_init()&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-1092&quot;&gt;&lt;del&gt;LU-1092&lt;/del&gt;&lt;/a&gt; patch in 2.1?  These crashes are having a pretty big impact on our production systems.  Turning off OSS read cache seems to help avoid them, so we&apos;ve been leaving it turned off, but that has its own severe performance impacts for some workloads.  For now we&apos;ll cherry-pick the fix in our tree.&lt;/p&gt;</comment>
                            <comment id="35880" author="pjones" created="Mon, 30 Apr 2012 11:55:34 +0000"  >&lt;p&gt;Ned&lt;/p&gt;

&lt;p&gt;We have landed LU-1092 for 2.1.2 also. Please reopen if this is not a duplicate after all.&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                    </comments>
                    <attachments>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvh1r:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>6411</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>