<!-- 
RSS generated by JIRA (9.4.14#940014-sha1:734e6822bbf0d45eff9af51f82432957f73aa32c) at Sat Feb 10 01:33:52 UTC 2024

It is possible to restrict the fields that are returned in this document by specifying the 'field' parameter in your request.
For example, to request only the issue key and summary append 'field=key&field=summary' to the URL of your request.
-->
<rss version="0.92" >
<channel>
    <title>Whamcloud Community JIRA</title>
    <link>https://jira.whamcloud.com</link>
    <description>This file is an XML representation of an issue</description>
    <language>en-us</language>    <build-info>
        <version>9.4.14</version>
        <build-number>940014</build-number>
        <build-date>05-12-2023</build-date>
    </build-info>


<item>
            <title>[LU-3433] Encountered an assertion for the ols_state being set to an impossible state</title>
                <link>https://jira.whamcloud.com/browse/LU-3433</link>
                <project id="10000" key="LU">Lustre</project>
                    <description>&lt;p&gt;During a test run using Lustre 2.4 one of our clients encountered this LBUG.&lt;/p&gt;

&lt;p&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt;LustreError:16573:0:(osc_lock.c:1165:osc_lock_enqueue()) ASSERTION( ols-&amp;gt;ols_state == OLS_NEW ) failed: Impossible state: 4&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt;LustreError: 16573:0&lt;br/&gt;
(osc_lock.c:1165:osc_lock_enqueue()) LBUG&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81006451&amp;gt;&amp;#93;&lt;/span&gt; try_stack_unwind+0x161/0x1a0&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81004ca9&amp;gt;&amp;#93;&lt;/span&gt; dump_trace+0x89/0x440&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa013a897&amp;gt;&amp;#93;&lt;/span&gt; libcfs_debug_dumpstack+0x57/0x80 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa013ade7&amp;gt;&amp;#93;&lt;/span&gt; lbug_with_loc+0x47/0xc0 &lt;span class=&quot;error&quot;&gt;&amp;#91;libcfs&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0639f55&amp;gt;&amp;#93;&lt;/span&gt; osc_lock_enqueue+0x725/0x8b0 &lt;span class=&quot;error&quot;&gt;&amp;#91;osc&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa032d4eb&amp;gt;&amp;#93;&lt;/span&gt; cl_enqueue_try+0xfb/0x320 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa06ccded&amp;gt;&amp;#93;&lt;/span&gt; lov_lock_enqueue+0x1fd/0x880 &lt;span class=&quot;error&quot;&gt;&amp;#91;lov&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa032d4eb&amp;gt;&amp;#93;&lt;/span&gt; cl_enqueue_try+0xfb/0x320 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa032e3bf&amp;gt;&amp;#93;&lt;/span&gt; cl_enqueue_locked+0x7f/0x1f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa032efbe&amp;gt;&amp;#93;&lt;/span&gt; cl_lock_request+0x7e/0x270 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa0334274&amp;gt;&amp;#93;&lt;/span&gt; cl_io_lock+0x394/0x5c0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa033453a&amp;gt;&amp;#93;&lt;/span&gt; cl_io_loop+0x9a/0x1a0 &lt;span class=&quot;error&quot;&gt;&amp;#91;obdclass&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa074b90f&amp;gt;&amp;#93;&lt;/span&gt; ll_file_io_generic+0x33f/0x5f0 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa074c08b&amp;gt;&amp;#93;&lt;/span&gt; ll_file_aio_read+0x23b/0x290 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffffa074d002&amp;gt;&amp;#93;&lt;/span&gt; ll_file_read+0x1f2/0x280 &lt;span class=&quot;error&quot;&gt;&amp;#91;lustre&amp;#93;&lt;/span&gt;&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81135548&amp;gt;&amp;#93;&lt;/span&gt; vfs_read+0xc8/0x180&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8113b799&amp;gt;&amp;#93;&lt;/span&gt; kernel_read+0x49/0x60&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8113b885&amp;gt;&amp;#93;&lt;/span&gt; prepare_binprm+0xd5/0x100&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8113c670&amp;gt;&amp;#93;&lt;/span&gt; do_execve_common+0x1c0/0x300&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8113c83f&amp;gt;&amp;#93;&lt;/span&gt; do_execve+0x3f/0x50&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff8100ae1e&amp;gt;&amp;#93;&lt;/span&gt; sys_execve+0x4e/0x80&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;ffffffff81316a3c&amp;gt;&amp;#93;&lt;/span&gt; stub_execve+0x6c/0xc0&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt; &lt;span class=&quot;error&quot;&gt;&amp;#91;&amp;lt;0000000020176437&amp;gt;&amp;#93;&lt;/span&gt; 0x20176437&lt;br/&gt;
&lt;span class=&quot;error&quot;&gt;&amp;#91;2013-05-29 18:39:47&amp;#93;&lt;/span&gt;&lt;span class=&quot;error&quot;&gt;&amp;#91;c7-1c1s3n3&amp;#93;&lt;/span&gt;Kernel panic - not syncing: LBUG&lt;/p&gt;</description>
                <environment>Cray Lustre 2.4 clients running on SLES11 SP2.</environment>
        <key id="19275">LU-3433</key>
            <summary>Encountered an assertion for the ols_state being set to an impossible state</summary>
                <type id="1" iconUrl="https://jira.whamcloud.com/secure/viewavatar?size=xsmall&amp;avatarId=11303&amp;avatarType=issuetype">Bug</type>
                                            <priority id="3" iconUrl="https://jira.whamcloud.com/images/icons/priorities/major.svg">Major</priority>
                        <status id="5" iconUrl="https://jira.whamcloud.com/images/icons/statuses/resolved.png" description="A resolution has been taken, and it is awaiting verification by reporter. From here issues are either reopened, or are closed.">Resolved</status>
                    <statusCategory id="3" key="done" colorName="success"/>
                                    <resolution id="1">Fixed</resolution>
                                        <assignee username="niu">Niu Yawei</assignee>
                                    <reporter username="simmonsja">James A Simmons</reporter>
                        <labels>
                            <label>mn4</label>
                    </labels>
                <created>Mon, 3 Jun 2013 13:56:17 +0000</created>
                <updated>Wed, 12 Nov 2014 18:07:18 +0000</updated>
                            <resolved>Thu, 20 Feb 2014 15:36:24 +0000</resolved>
                                    <version>Lustre 2.4.0</version>
                    <version>Lustre 2.4.1</version>
                                    <fixVersion>Lustre 2.5.0</fixVersion>
                                        <due></due>
                            <votes>0</votes>
                                    <watches>16</watches>
                                                                            <comments>
                            <comment id="59888" author="pjones" created="Mon, 3 Jun 2013 14:45:12 +0000"  >&lt;p&gt;Niu&lt;/p&gt;

&lt;p&gt;Could you please look into this one?&lt;/p&gt;

&lt;p&gt;Thanks&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                            <comment id="59901" author="paf" created="Mon, 3 Jun 2013 17:25:31 +0000"  >&lt;p&gt;Cray has recently noticed this LBUG while testing for a possible different source for the EINTR reported in &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;.  A reproducer very similar to that one can consistently produce this bug during writes or truncates.  I have not tested reads, but I&apos;m inclined to believe it would reproduce the bug for reads as well.&lt;/p&gt;

&lt;p&gt;I&apos;ll attach the reproducer for this bug for write/truncate.&lt;/p&gt;

&lt;p&gt;Briefly, the reproducer spawns a child thread, then the parent sets up a signal handler for SIGINT with SA_RESTART set, and loops the IO operation in question (It&apos;s set up for write or truncate, and could be modified to use read), while the child spams SIGINT at the parent.&lt;/p&gt;

&lt;p&gt;This bug is much easier to reproduce with +trace debugging enabled.  Without, it usually requires looping the reproducer, sometimes for several minutes.  The provided shell script loops the reproducer.&lt;/p&gt;</comment>
                            <comment id="59947" author="niu" created="Tue, 4 Jun 2013 09:41:17 +0000"  >&lt;p&gt;This looks like a regression introduced by &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;, when I removed the fix of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;, the LBUG can&apos;t be reproduced anymore, but I don&apos;t know the exact reason yet. Patrick, can you reproduce it after removing the fix of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;?&lt;/p&gt;</comment>
                            <comment id="59957" author="simmonsja" created="Tue, 4 Jun 2013 12:11:54 +0000"  >&lt;p&gt;Do you have a reproducer for the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt; as well? It would be nice to make both conditions work.&lt;/p&gt;</comment>
                            <comment id="59963" author="paf" created="Tue, 4 Jun 2013 14:11:05 +0000"  >&lt;p&gt;James,&lt;/p&gt;

&lt;p&gt;It&apos;s the same reproducer, actually.  This one - as long as it&apos;s in write mode and not truncate &lt;span class=&quot;error&quot;&gt;&amp;#91;it might work in truncate, I haven&amp;#39;t tested&amp;#93;&lt;/span&gt; - should reproduce &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt; just fine.  All I changed was to tweak the timings to hit this LBUG more reliably.  Without the patch for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;, &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt; was quite easy to hit.&lt;/p&gt;

&lt;p&gt;Niu,&lt;/p&gt;

&lt;p&gt;I&apos;m not sure if I could reproduce it - I can try a bit later.  Without &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;, the system call is not restarted, because it returns EINTR.  That changes the timing and behavior profile immensely.  I don&apos;t think this was &apos;caused&apos; by &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt;, rather it was revealed by it.&lt;/p&gt;

&lt;p&gt;Presumably, when a system call is restarted, sometimes we wind up in this nasty state.  If EINTR is returned instead (&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3020&quot; title=&quot;Lustre returns EINTR during writes when SA_RESTART is set&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3020&quot;&gt;&lt;del&gt;LU-3020&lt;/del&gt;&lt;/a&gt; removed), then the system call is not restarted.  It&apos;s possible we only get to this state through restarting, or it&apos;s possible that we only get there through interrupting the system call at a very specific time, regardless of the restart behavior.&lt;/p&gt;

&lt;ul class=&quot;alternate&quot; type=&quot;square&quot;&gt;
	&lt;li&gt;Patrick&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="60200" author="paf" created="Fri, 7 Jun 2013 21:53:08 +0000"  >&lt;p&gt;Niu, James,&lt;/p&gt;

&lt;p&gt;We have a candidate patch for this from Xyratex that we&apos;re testing on our end.  It appears to resolve the issue, and once I&apos;m sure it&apos;s solid, we&apos;ll make sure it&apos;s pushed upstream.&lt;/p&gt;

&lt;ul class=&quot;alternate&quot; type=&quot;square&quot;&gt;
	&lt;li&gt;Patrick&lt;/li&gt;
&lt;/ul&gt;
</comment>
                            <comment id="60896" author="vitaly_fertman" created="Wed, 19 Jun 2013 22:30:38 +0000"  >&lt;p&gt;&lt;a href=&quot;http://review.whamcloud.com/6709&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/6709&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="65123" author="niu" created="Tue, 27 Aug 2013 02:55:59 +0000"  >&lt;p&gt;patch landed for 2.5&lt;/p&gt;</comment>
                            <comment id="73201" author="yujian" created="Tue, 10 Dec 2013 16:22:46 +0000"  >&lt;p&gt;Lustre Build: &lt;a href=&quot;http://build.whamcloud.com/job/lustre-b2_4/66/&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://build.whamcloud.com/job/lustre-b2_4/66/&lt;/a&gt;&lt;br/&gt;
Distro/Arch: RHEL6.4/x86_64&lt;/p&gt;

&lt;p&gt;The same failure occurred while running parallel-scale test write_disjoint:&lt;br/&gt;
&lt;a href=&quot;https://maloo.whamcloud.com/test_sets/e255840a-6193-11e3-a871-52540035b04c&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;https://maloo.whamcloud.com/test_sets/e255840a-6193-11e3-a871-52540035b04c&lt;/a&gt;&lt;/p&gt;

&lt;p&gt;Console log on client node:&lt;/p&gt;
&lt;div class=&quot;preformatted panel&quot; style=&quot;border-width: 1px;&quot;&gt;&lt;div class=&quot;preformattedContent panelContent&quot;&gt;
&lt;pre&gt;17:35:46:Lustre: DEBUG MARKER: == parallel-scale test write_disjoint: write_disjoint == 17:31:44 (1386639104)
17:35:46:LustreError: 12360:0:(osc_lock.c:1165:osc_lock_enqueue()) ASSERTION( ols-&amp;gt;ols_state == OLS_NEW ) failed: Impossible state: 6
17:35:46:LustreError: 12360:0:(osc_lock.c:1165:osc_lock_enqueue()) LBUG
17:35:46:Pid: 12360, comm: write_disjoint
17:35:47:
17:35:47:Call Trace:
17:35:47: [&amp;lt;ffffffffa19ac895&amp;gt;] libcfs_debug_dumpstack+0x55/0x80 [libcfs]
17:35:47: [&amp;lt;ffffffffa19ace97&amp;gt;] lbug_with_loc+0x47/0xb0 [libcfs]
17:35:47: [&amp;lt;ffffffffa05e4fc0&amp;gt;] ? osc_lock_enqueue+0x0/0x870 [osc]
17:35:47: [&amp;lt;ffffffffa05e5674&amp;gt;] osc_lock_enqueue+0x6b4/0x870 [osc]
17:35:47: [&amp;lt;ffffffffa19ad717&amp;gt;] ? cfs_waitq_broadcast+0x17/0x20 [libcfs]
17:35:47: [&amp;lt;ffffffffa1b15f5e&amp;gt;] ? cl_lock_state_signal+0x7e/0x160 [obdclass]
17:35:47: [&amp;lt;ffffffffa1b19d4c&amp;gt;] cl_enqueue_try+0xfc/0x300 [obdclass]
17:35:47: [&amp;lt;ffffffffa06620da&amp;gt;] lov_lock_enqueue+0x22a/0x850 [lov]
17:35:47: [&amp;lt;ffffffffa1b19d4c&amp;gt;] cl_enqueue_try+0xfc/0x300 [obdclass]
17:35:47: [&amp;lt;ffffffffa1b1b13f&amp;gt;] cl_enqueue_locked+0x6f/0x1f0 [obdclass]
17:35:47: [&amp;lt;ffffffffa1b1bdae&amp;gt;] cl_lock_request+0x7e/0x270 [obdclass]
17:35:47: [&amp;lt;ffffffffa1b2104c&amp;gt;] cl_io_lock+0x3cc/0x560 [obdclass]
17:35:48: [&amp;lt;ffffffffa1b21282&amp;gt;] cl_io_loop+0xa2/0x1b0 [obdclass]
17:35:48: [&amp;lt;ffffffffa06e09e0&amp;gt;] ll_file_io_generic+0x450/0x600 [lustre]
17:35:48: [&amp;lt;ffffffffa06e1922&amp;gt;] ll_file_aio_write+0x142/0x2c0 [lustre]
17:35:48: [&amp;lt;ffffffffa06e1c0c&amp;gt;] ll_file_write+0x16c/0x2a0 [lustre]
17:35:48: [&amp;lt;ffffffff81181398&amp;gt;] vfs_write+0xb8/0x1a0
17:35:48: [&amp;lt;ffffffff81181c91&amp;gt;] sys_write+0x51/0x90
17:35:48: [&amp;lt;ffffffff810dc685&amp;gt;] ? __audit_syscall_exit+0x265/0x290
17:35:48: [&amp;lt;ffffffff8100b072&amp;gt;] system_call_fastpath+0x16/0x1b
17:35:48:
17:35:48:Kernel panic - not syncing: LBUG
&lt;/pre&gt;
&lt;/div&gt;&lt;/div&gt;

&lt;p&gt;Patch back-ported to Lustre b2_4 branch: &lt;a href=&quot;http://review.whamcloud.com/8530&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8530&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="73653" author="yujian" created="Tue, 17 Dec 2013 06:07:14 +0000"  >&lt;p&gt;Patch landed on Lustre b2_4 branch for 2.4.2.&lt;/p&gt;</comment>
                            <comment id="73901" author="adilger" created="Thu, 19 Dec 2013 22:51:39 +0000"  >&lt;p&gt;Patch is being reverted from b2_4 due to test failures: &lt;a href=&quot;http://review.whamcloud.com/8621&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/8621&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="75943" author="morrone" created="Thu, 30 Jan 2014 21:23:41 +0000"  >&lt;p&gt;We saw the same assertion in production at LLNL with Lustre 2.4.0-19chaos.  Unfortunately it did not dump the backtrace to the console, and the crash dump failed.  But the assertion and particular unknown state (4) were the same as in this ticket, so I am assuming that it is the same bug.&lt;/p&gt;

&lt;p&gt;Since the fix needed to be reverted, it would appear that this issue needs to be reopened.&lt;/p&gt;</comment>
                            <comment id="76435" author="paf" created="Fri, 7 Feb 2014 05:05:24 +0000"  >&lt;p&gt;Christopher - I&apos;m not sure what exactly your 2.4.0-19 consists of, but Intel&apos;s 2.4.0 does not have this patch reverted.  Only if you&apos;re pulling updated sources from the b2.4 (or whatever it&apos;s called - sorry) branch in the repo, would you have the patch reverted.&lt;/p&gt;

&lt;p&gt;If you&apos;ve got 2.4.0 (or even 2.4.1, I believe), you wouldn&apos;t have the patch to begin with.&lt;/p&gt;</comment>
                            <comment id="76437" author="morrone" created="Fri, 7 Feb 2014 05:19:40 +0000"  >&lt;p&gt;Patrick - I understand that.  We hit the bug described in this ticket, not the bug caused by the fix for this ticket.  We would like to be able to cherry-pick the fix so that our client does not hit this assertion, but if the patch needed to be reverted it is not yet safe for me to do so.&lt;/p&gt;
</comment>
                            <comment id="76527" author="niu" created="Sat, 8 Feb 2014 02:57:37 +0000"  >&lt;p&gt;The fix of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3889&quot; title=&quot; LBUG: (osc_lock.c:497:osc_lock_upcall()) ASSERTION( lock-&amp;gt;cll_state &amp;gt;= CLS_QUEUING ) &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3889&quot;&gt;&lt;del&gt;LU-3889&lt;/del&gt;&lt;/a&gt; has been landed on master &amp;amp; b2_5, it looks to me that we should just re-add this patch and backport the fix of &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3889&quot; title=&quot; LBUG: (osc_lock.c:497:osc_lock_upcall()) ASSERTION( lock-&amp;gt;cll_state &amp;gt;= CLS_QUEUING ) &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3889&quot;&gt;&lt;del&gt;LU-3889&lt;/del&gt;&lt;/a&gt; to b2_4.&lt;/p&gt;

&lt;p&gt;Bob, what&apos;s your opinion? I see the revert patch was uploaded by you, why did we revert this patch instead of backporting the &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3889&quot; title=&quot; LBUG: (osc_lock.c:497:osc_lock_upcall()) ASSERTION( lock-&amp;gt;cll_state &amp;gt;= CLS_QUEUING ) &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3889&quot;&gt;&lt;del&gt;LU-3889&lt;/del&gt;&lt;/a&gt; fix?&lt;/p&gt;</comment>
                            <comment id="76535" author="pjones" created="Sat, 8 Feb 2014 03:56:46 +0000"  >&lt;p&gt;Just timing. At the time the fix for &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3889&quot; title=&quot; LBUG: (osc_lock.c:497:osc_lock_upcall()) ASSERTION( lock-&amp;gt;cll_state &amp;gt;= CLS_QUEUING ) &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3889&quot;&gt;&lt;del&gt;LU-3889&lt;/del&gt;&lt;/a&gt; was unproven so reverting to the previous known state was preferable. I think that moving forward with both fixes is a sound approach.&lt;/p&gt;</comment>
                            <comment id="76563" author="niu" created="Mon, 10 Feb 2014 02:46:29 +0000"  >&lt;p&gt;ported &lt;a href=&quot;https://jira.whamcloud.com/browse/LU-3889&quot; title=&quot; LBUG: (osc_lock.c:497:osc_lock_upcall()) ASSERTION( lock-&amp;gt;cll_state &amp;gt;= CLS_QUEUING ) &quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-3889&quot;&gt;&lt;del&gt;LU-3889&lt;/del&gt;&lt;/a&gt; fix to b2_4: &lt;a href=&quot;http://review.whamcloud.com/9194&quot; class=&quot;external-link&quot; target=&quot;_blank&quot; rel=&quot;nofollow noopener&quot;&gt;http://review.whamcloud.com/9194&lt;/a&gt;&lt;/p&gt;</comment>
                            <comment id="80216" author="knweiss" created="Tue, 25 Mar 2014 14:29:44 +0000"  >&lt;p&gt;Niu/Peter, will this backport be merged into b2_4 (for 2.4.4)? I saw this bug on three lustre 2.4.2 clients and AFAIKS your patch is not included in 2.4.3 (we&apos;re using this version now) or b2_4.&lt;/p&gt;</comment>
                            <comment id="80217" author="pjones" created="Tue, 25 Mar 2014 14:33:30 +0000"  >&lt;p&gt;Karsten&lt;/p&gt;

&lt;p&gt;This would certainly be under consideration for a fuller 2.4.x maintenance release. 2.4.3 had limited content because it was an unscheduled release driven by the need to issue a 2.4.x release to address the security vulnerability discovered (&lt;a href=&quot;https://jira.whamcloud.com/browse/LU-4703&quot; title=&quot;setxattr(2) will succeed by a non root user, against a file the user doesn&amp;#39;t own.&quot; class=&quot;issue-link&quot; data-issue-key=&quot;LU-4703&quot;&gt;&lt;del&gt;LU-4703&lt;/del&gt;&lt;/a&gt;/4704)&lt;/p&gt;

&lt;p&gt;Peter&lt;/p&gt;</comment>
                    </comments>
                <issuelinks>
                            <issuelinktype id="10011">
                    <name>Related</name>
                                            <outwardlinks description="is related to ">
                                        <issuelink>
            <issuekey id="20796">LU-3889</issuekey>
        </issuelink>
            <issuelink>
            <issuekey id="18064">LU-3020</issuekey>
        </issuelink>
                            </outwardlinks>
                                                                <inwardlinks description="is related to">
                                        <issuelink>
            <issuekey id="27557">LU-5910</issuekey>
        </issuelink>
                            </inwardlinks>
                                    </issuelinktype>
                    </issuelinks>
                <attachments>
                            <attachment id="12982" name="test.sh" size="200" author="paf" created="Mon, 3 Jun 2013 17:26:40 +0000"/>
                            <attachment id="12983" name="write-eintr.c" size="3112" author="paf" created="Mon, 3 Jun 2013 17:26:40 +0000"/>
                    </attachments>
                <subtasks>
                    </subtasks>
                <customfields>
                                                                                                                                                                                            <customfield id="customfield_10890" key="com.atlassian.jira.plugins.jira-development-integration-plugin:devsummary">
                        <customfieldname>Development</customfieldname>
                        <customfieldvalues>
                            
                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        <customfield id="customfield_10390" key="com.pyxis.greenhopper.jira:gh-lexo-rank">
                        <customfieldname>Rank</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>1|hzvsov:</customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                <customfield id="customfield_10090" key="com.pyxis.greenhopper.jira:gh-global-rank">
                        <customfieldname>Rank (Obsolete)</customfieldname>
                        <customfieldvalues>
                            <customfieldvalue>8552</customfieldvalue>
                        </customfieldvalues>
                    </customfield>
                                                                                            <customfield id="customfield_10060" key="com.atlassian.jira.plugin.system.customfieldtypes:select">
                        <customfieldname>Severity</customfieldname>
                        <customfieldvalues>
                                <customfieldvalue key="10022"><![CDATA[3]]></customfieldvalue>

                        </customfieldvalues>
                    </customfield>
                                                                                                                                                                                                                                                                                                                                                        </customfields>
    </item>
</channel>
</rss>